diff --git a/.gitattributes b/.gitattributes
index a6344aac8c09253b3b630fb776ae94478aa0275b..52373fe24473b1aa44333d318f578ae6bf04b49b 100644
--- a/.gitattributes
+++ b/.gitattributes
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
*.zip filter=lfs diff=lfs merge=lfs -text
*.zst filter=lfs diff=lfs merge=lfs -text
*tfevents* filter=lfs diff=lfs merge=lfs -text
+tokenizer.json filter=lfs diff=lfs merge=lfs -text
diff --git a/README.md b/README.md
new file mode 100644
index 0000000000000000000000000000000000000000..4c192fb495da2b7b34030deda13f226c99060650
--- /dev/null
+++ b/README.md
@@ -0,0 +1,57 @@
+---
+language:
+- en
+- zh
+library_name: transformers
+license: mit
+pipeline_tag: text-generation
+---
+
+# GLM-4.6-FP8
+
+
+

+
+
+ 👋 Join our Discord community.
+
+ 📖 Check out the GLM-4.6 technical blog, technical report (GLM-4.5), and Zhipu AI technical documentation.
+
+ 📍 Use GLM-4.6 API services on Z.ai API Platform.
+
+ 👉 One click to GLM-4.6.
+
+
+## Model Introduction
+
+Compared with GLM-4.5, **GLM-4.6** brings several key improvements:
+
+* **Longer context window:** The context window has been expanded from 128K to 200K tokens, enabling the model to handle more complex agentic tasks.
+* **Superior coding performance:** The model achieves higher scores on code benchmarks and demonstrates better real-world performance in applications such as Claude Code, Cline, Roo Code and Kilo Code, including improvements in generating visually polished front-end pages.
+* **Advanced reasoning:** GLM-4.6 shows a clear improvement in reasoning performance and supports tool use during inference, leading to stronger overall capability.
+* **More capable agents:** GLM-4.6 exhibits stronger performance in tool use and search-based agents, and integrates more effectively within agent frameworks.
+* **Refined writing:** Better aligns with human preferences in style and readability, and performs more naturally in role-playing scenarios.
+
+We evaluated GLM-4.6 across eight public benchmarks covering agents, reasoning, and coding. Results show clear gains over GLM-4.5, with GLM-4.6 also holding competitive advantages over leading domestic and international models such as **DeepSeek-V3.1-Terminus** and **Claude Sonnet 4**.
+
+
+
+## Inference
+
+**Both GLM-4.5 and GLM-4.6 use the same inference method.**
+
+You can check our [GitHub repository](https://github.com/zai-org/GLM-4.5) for more details.
+
+## Recommended Evaluation Parameters
+
+For general evaluations, we recommend using a **sampling temperature of 1.0**.
+
+For **code-related evaluation tasks** (such as LCB), it is further recommended to set:
+
+- `top_p = 0.95`
+- `top_k = 40`
+
+## Evaluation
+
+- For tool-integrated reasoning, please refer to [this doc](https://github.com/zai-org/GLM-4.5/blob/main/resources/glm_4.6_tir_guide.md).
+- For search benchmarks, we designed a specific tool-call format for searching in thinking mode to support search agents; please refer to [this file](https://github.com/zai-org/GLM-4.5/blob/main/resources/trajectory_search.json) for the detailed template.
diff --git a/chat_template.jinja b/chat_template.jinja
new file mode 100644
index 0000000000000000000000000000000000000000..41478957aca7a04b7321022e7d1f73de5badd995
--- /dev/null
+++ b/chat_template.jinja
@@ -0,0 +1,103 @@
+[gMASK]<sop>
+{%- if tools -%}
+<|system|>
+# Tools
+
+You may call one or more functions to assist with the user query.
+
+You are provided with function signatures within <tools></tools> XML tags:
+<tools>
+{% for tool in tools %}
+{{ tool | tojson(ensure_ascii=False) }}
+{% endfor %}
+</tools>
+
+For each function call, output the function name and arguments within the following XML format:
+<tool_call>{function-name}
+<arg_key>{arg-key-1}</arg_key>
+<arg_value>{arg-value-1}</arg_value>
+<arg_key>{arg-key-2}</arg_key>
+<arg_value>{arg-value-2}</arg_value>
+...
+</tool_call>{%- endif -%}
+{%- macro visible_text(content) -%}
+ {%- if content is string -%}
+ {{- content }}
+ {%- elif content is iterable and content is not mapping -%}
+ {%- for item in content -%}
+ {%- if item is mapping and item.type == 'text' -%}
+ {{- item.text }}
+ {%- elif item is string -%}
+ {{- item }}
+ {%- endif -%}
+ {%- endfor -%}
+ {%- else -%}
+ {{- content }}
+ {%- endif -%}
+{%- endmacro -%}
+{%- set ns = namespace(last_user_index=-1) %}
+{%- for m in messages %}
+ {%- if m.role == 'user' %}
+ {% set ns.last_user_index = loop.index0 -%}
+ {%- endif %}
+{%- endfor %}
+{% for m in messages %}
+{%- if m.role == 'user' -%}<|user|>
+{{ visible_text(m.content) }}
+{{- '/nothink' if (enable_thinking is defined and not enable_thinking and not visible_text(m.content).endswith("/nothink")) else '' -}}
+{%- elif m.role == 'assistant' -%}
+<|assistant|>
+{%- set reasoning_content = '' %}
+{%- set content = visible_text(m.content) %}
+{%- if m.reasoning_content is string %}
+ {%- set reasoning_content = m.reasoning_content %}
+{%- else %}
+ {%- if '</think>' in content %}
+ {%- set reasoning_content = content.split('</think>')[0].rstrip('\n').split('<think>')[-1].lstrip('\n') %}
+ {%- set content = content.split('</think>')[-1].lstrip('\n') %}
+ {%- endif %}
+{%- endif %}
+{%- if loop.index0 > ns.last_user_index and reasoning_content -%}
+{{ '\n<think>' + reasoning_content.strip() + '</think>'}}
+{%- else -%}
+{{ '\n<think></think>' }}
+{%- endif -%}
+{%- if content.strip() -%}
+{{ '\n' + content.strip() }}
+{%- endif -%}
+{% if m.tool_calls %}
+{% for tc in m.tool_calls %}
+{%- if tc.function %}
+ {%- set tc = tc.function %}
+{%- endif %}
+{{ '\n<tool_call>' + tc.name }}
+{% set _args = tc.arguments %}
+{% for k, v in _args.items() %}
+<arg_key>{{ k }}</arg_key>
+<arg_value>{{ v | tojson(ensure_ascii=False) if v is not string else v }}</arg_value>
+{% endfor %}
+</tool_call>{% endfor %}
+{% endif %}
+{%- elif m.role == 'tool' -%}
+{%- if m.content is string -%}
+{%- if loop.first or (messages[loop.index0 - 1].role != "tool") %}
+ {{- '<|observation|>' }}
+{%- endif %}
+{{- '\n<tool_response>\n' }}
+{{- m.content }}
+{{- '\n</tool_response>' }}
+{%- else -%}
+<|observation|>{% for tr in m.content %}
+
+<tool_response>
+{{ tr.output if tr.output is defined else tr }}
+</tool_response>{% endfor -%}
+{% endif -%}
+{%- elif m.role == 'system' -%}
+<|system|>
+{{ visible_text(m.content) }}
+{%- endif -%}
+{%- endfor -%}
+{%- if add_generation_prompt -%}
+ <|assistant|>{{- '\n<think></think>' if (enable_thinking is defined and not enable_thinking) else '' -}}
+{%- endif -%}
\ No newline at end of file
diff --git a/config.json b/config.json
new file mode 100644
index 0000000000000000000000000000000000000000..18b50c45ccc5ccc466fc9527f33abc0b1515a9d5
--- /dev/null
+++ b/config.json
@@ -0,0 +1,43 @@
+{
+ "architectures": [
+ "Glm4MoeForCausalLM"
+ ],
+ "attention_bias": true,
+ "attention_dropout": 0.0,
+ "eos_token_id": [
+ 151329,
+ 151336,
+ 151338
+ ],
+ "first_k_dense_replace": 3,
+ "head_dim": 128,
+ "hidden_act": "silu",
+ "hidden_size": 5120,
+ "initializer_range": 0.02,
+ "intermediate_size": 12288,
+ "max_position_embeddings": 202752,
+ "model_type": "glm4_moe",
+ "moe_intermediate_size": 1536,
+ "n_group": 1,
+ "n_routed_experts": 160,
+ "n_shared_experts": 1,
+ "norm_topk_prob": true,
+ "num_attention_heads": 96,
+ "num_experts_per_tok": 8,
+ "num_hidden_layers": 92,
+ "num_key_value_heads": 8,
+ "num_nextn_predict_layers": 1,
+ "pad_token_id": 151329,
+ "partial_rotary_factor": 0.5,
+ "rms_norm_eps": 1e-05,
+ "rope_scaling": null,
+ "rope_theta": 1000000,
+ "routed_scaling_factor": 2.5,
+ "tie_word_embeddings": false,
+ "topk_group": 1,
+ "torch_dtype": "bfloat16",
+ "transformers_version": "4.54.0",
+ "use_cache": true,
+ "use_qk_norm": true,
+ "vocab_size": 151552
+}
\ No newline at end of file
diff --git a/generation_config.json b/generation_config.json
new file mode 100644
index 0000000000000000000000000000000000000000..55942563772385555a04b7be7ce33240c1c2d15e
--- /dev/null
+++ b/generation_config.json
@@ -0,0 +1,11 @@
+{
+ "_from_model_config": true,
+ "eos_token_id": [
+ 151329,
+ 151336,
+ 151338
+ ],
+ "temperature": 1.0,
+ "pad_token_id": 151329,
+ "transformers_version": "4.54.0"
+}
diff --git a/model-00001-of-00092.safetensors b/model-00001-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..60f51f68033717b3e74ca1b1b1364f2323397d4d
--- /dev/null
+++ b/model-00001-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:792e4fc6b8e4d2a80621c5293cbe8f3f224c992d0a8ef063336c7101ffb93ab2
+size 1877199768
diff --git a/model-00002-of-00092.safetensors b/model-00002-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..96a003163d85f42742f5c4703161ed987fad7668
--- /dev/null
+++ b/model-00002-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6dbab970e29d8fa7702f18eb66f79c01ccf281fdf67aa771b9f5b31cfa5cea94
+size 325307112
diff --git a/model-00003-of-00092.safetensors b/model-00003-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..0afeb191aad68c9da86fad64e22ffdcb9df2aacf
--- /dev/null
+++ b/model-00003-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:83f8b33ea59f013c8a841e33c4048c715c0b03fb01ee613b97ea7bd74edd950c
+size 325307112
diff --git a/model-00004-of-00092.safetensors b/model-00004-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..ef4f528c474108fba6afd63d164908528a84fed9
--- /dev/null
+++ b/model-00004-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d75ef26d0a512f49da588bc48b34803e177c97548f93433d945b157e57b279c1
+size 3941942552
diff --git a/model-00005-of-00092.safetensors b/model-00005-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..2958b1c79e9d1d2d8d15fd2cc5b926b3c2010f91
--- /dev/null
+++ b/model-00005-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:67404a14a1cc5fcaf7e43a37e4f528d72ff0b7f6b94cc75eda88487e1a2fde64
+size 3941942552
diff --git a/model-00006-of-00092.safetensors b/model-00006-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..d20a0d94cb627f1967639bacc92639cc80d23ce5
--- /dev/null
+++ b/model-00006-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:def0745e82451676a2f559ee82c3b64bba143eb892e0f5342876a6b625398f89
+size 3941942552
diff --git a/model-00007-of-00092.safetensors b/model-00007-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..a62f2fad1c490509ae8d716dbf0a5f886bb3ea32
--- /dev/null
+++ b/model-00007-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:59c7a39c12f940822cc71219221dd6e6db2152dd7a0fca9e09032ba2d8b76d8e
+size 3941942552
diff --git a/model-00008-of-00092.safetensors b/model-00008-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..c0bb9d7cdd8f5816d55a329c4da1ab26ed971811
--- /dev/null
+++ b/model-00008-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:809a46b2407e77d5c402ce8c4addda1755d5ee010baf917896249a92d3950c9b
+size 3941942552
diff --git a/model-00009-of-00092.safetensors b/model-00009-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..27520bf7a8bb10143b9dffd1f83e9e59a5e6ecaa
--- /dev/null
+++ b/model-00009-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:00f6c14f9255342e68d2a1dac7100336a07f3969506f7e868f4b06b0e9207322
+size 3941942552
diff --git a/model-00010-of-00092.safetensors b/model-00010-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..ad1261fd83ac39b336c899586e044112b9f7983f
--- /dev/null
+++ b/model-00010-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cb1a035e85a2cead00949b7897ce3c8517f1f32a072624d812eb3c927721baef
+size 3941942552
diff --git a/model-00011-of-00092.safetensors b/model-00011-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..7176823959bb6a0aecfa7931017ae232e16b03ce
--- /dev/null
+++ b/model-00011-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b558e5c2b9f22a1dd3add3fb74828b2bcdd9fb04b683a0b49d53ee21d8c261a0
+size 3941943536
diff --git a/model-00012-of-00092.safetensors b/model-00012-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..0eb4b9c1b389eef5815e1b742ca74ebe0f1834bc
--- /dev/null
+++ b/model-00012-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4360c5ad4b0bf089cf0991f5d1234264b8194b239ec5df9233701777ea44b7be
+size 3941943536
diff --git a/model-00013-of-00092.safetensors b/model-00013-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..fc101fd2d2adef7b99178786c03b16289a6706f1
--- /dev/null
+++ b/model-00013-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e1213d84e0061ec6963b099b76dbbcc895509e8e5099ca171d634c502d55ba52
+size 3941943536
diff --git a/model-00014-of-00092.safetensors b/model-00014-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..dda78af8423fa581c4d13f224d9b32bbf799412e
--- /dev/null
+++ b/model-00014-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a71970c0adbcbe333c2d2fddbbc0e27dd1fae877f480b407a2c3044521e03b23
+size 3941943536
diff --git a/model-00015-of-00092.safetensors b/model-00015-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..20fcd3cd75122caf1165462636daed4e587eac55
--- /dev/null
+++ b/model-00015-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b0b7cb187b9644504f5b4ffcfdf1db181d2ff0f99a5a70b3835f97dfb6e922c7
+size 3941943536
diff --git a/model-00016-of-00092.safetensors b/model-00016-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..4dd201a2212ce99b18089cfc885a973248066414
--- /dev/null
+++ b/model-00016-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9cd6921f2fd7ed226fcda639b03e8293725440e03495c34b04ed4373d77451cd
+size 3941943536
diff --git a/model-00017-of-00092.safetensors b/model-00017-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..e6f579f3c78c60c1783520741a8972d9d579a751
--- /dev/null
+++ b/model-00017-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e43f1ae28d72e0487d39a125e4593d58527a8447fbb961c4ddcfe498144033e2
+size 3941943536
diff --git a/model-00018-of-00092.safetensors b/model-00018-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..4bae237a3762e11d311b422f8a49cef66529ae61
--- /dev/null
+++ b/model-00018-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0df123959b5917759f12c03c2b8813c9e00dee9bf4fd14ee1c42d9c49e92c47c
+size 3941943536
diff --git a/model-00019-of-00092.safetensors b/model-00019-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..7b975ac707778e0e9c228d5de312951b1cefa17c
--- /dev/null
+++ b/model-00019-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9a8c8c4fc764fbcce316a59de9e862ad1e5b289a5350deec408a05efdc5fa4b0
+size 3941943536
diff --git a/model-00020-of-00092.safetensors b/model-00020-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..e5c769c9ed21a4e643047b6477d6d0f73936dd67
--- /dev/null
+++ b/model-00020-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e389a315ca8dd1ec1e5b5dfd363b5313179ee438f475f85a7d14cc9a802a6055
+size 3941943536
diff --git a/model-00021-of-00092.safetensors b/model-00021-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..d8fba06edad4e25177f0e38022c7109256f36158
--- /dev/null
+++ b/model-00021-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bcefb72e78bd4b0d4ac7275551ea96af0739574b9a56dd8b9d2c2e84c87faf78
+size 3941943536
diff --git a/model-00022-of-00092.safetensors b/model-00022-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..f3570ae073d27619798644765eae10b9300955d2
--- /dev/null
+++ b/model-00022-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a06c02892eb0d93ad39f082c920d0587d5c2be070e0912395b29ad1379567038
+size 3941943536
diff --git a/model-00023-of-00092.safetensors b/model-00023-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..d99a686ccb567eeb0cc60ed1c086b0625b9cc6cc
--- /dev/null
+++ b/model-00023-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:862d0456fd272189d65fc09c5b9888337efa066d881352bca2365db1e5350c6e
+size 3941943536
diff --git a/model-00024-of-00092.safetensors b/model-00024-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..5ecbb3092a74991f830cf35b8ca5e2d93718fffc
--- /dev/null
+++ b/model-00024-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1cf520b647b1b7adbd0fb33c7d02fb969907575c7893b4bedd57c96d7b3d883a
+size 3941943536
diff --git a/model-00025-of-00092.safetensors b/model-00025-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..bae2e1fc251a263b7d96269b5bfd9af314732e39
--- /dev/null
+++ b/model-00025-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0a66a852ff2bf51eb1bf88620c7664f428899cd88618e7bb0306112cc1791fbb
+size 3941943536
diff --git a/model-00026-of-00092.safetensors b/model-00026-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..454769b8c55b254a7e377ebf3d3ebc1b5b1fe9f0
--- /dev/null
+++ b/model-00026-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a850f74a0948773c497feb9cf50e887fabe03eb372c37b894d283fb8ae05047a
+size 3941943536
diff --git a/model-00027-of-00092.safetensors b/model-00027-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..7a5e3edd43d2ef0eb40bc3665b09bee71a3ba75b
--- /dev/null
+++ b/model-00027-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:dbd77174221f3284c6d0c401c09d9e721f04663fead02d5d32b1f9e7e4b0b078
+size 3941943536
diff --git a/model-00028-of-00092.safetensors b/model-00028-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..70ab3e62be621043459d1acd228f468fc7d01cbf
--- /dev/null
+++ b/model-00028-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e8b6004f6572455d234ac82602c8733c515efde70f92cd36b9bcd8471d43af87
+size 3941943536
diff --git a/model-00029-of-00092.safetensors b/model-00029-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..e5707dcda1ce6ef72cb468f6a92e9db8db2ba82c
--- /dev/null
+++ b/model-00029-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:72f254cbcdb9b30d7e8ee27d8961a08e560c09a8aa6aa93cc28ef7261b178d72
+size 3941943536
diff --git a/model-00030-of-00092.safetensors b/model-00030-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..7ba17b6c527937b2fa6bedcb6b66fc731af79195
--- /dev/null
+++ b/model-00030-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8ffcaf23d3adb8f57cf45af3f8029c8e04bb755355aa45ea337cc52541ddad50
+size 3941943536
diff --git a/model-00031-of-00092.safetensors b/model-00031-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..2dba93e493de4ff2c7e338deb68f0a9fbfa4dd07
--- /dev/null
+++ b/model-00031-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6b3fb01326e67340e73807e98b1b32f00434d4645aa494d08f3534b6a6559bfb
+size 3941943536
diff --git a/model-00032-of-00092.safetensors b/model-00032-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..e0c281cdc80d88f7c874f0c9f806ec756faa8a63
--- /dev/null
+++ b/model-00032-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:179b66d37cebac7d16e495bc3b818f4dcf905567b51966ea4c31eb3e2ffc96db
+size 3941943536
diff --git a/model-00033-of-00092.safetensors b/model-00033-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..f2583393d244d9ab3b49bd4f28f379fcca5968c7
--- /dev/null
+++ b/model-00033-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4d0424954737a9b0e537f9c258c26f7602c2d45a0790a6708a2b6f9205719ef5
+size 3941943536
diff --git a/model-00034-of-00092.safetensors b/model-00034-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..21d3882a3613797c9a4c3ee1a7f547860863638a
--- /dev/null
+++ b/model-00034-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:17826f12a95cb2fd4b2395976145cba948b08d3254828154f042d4f0c4e0ec6e
+size 3941943536
diff --git a/model-00035-of-00092.safetensors b/model-00035-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..cb286ee6b06396263bd1cb7979f1f198b6f37206
--- /dev/null
+++ b/model-00035-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:15d2883ad4ce8e824ae2643664f26e443cc1d0211b3a959b3500ec382442cc35
+size 3941943536
diff --git a/model-00036-of-00092.safetensors b/model-00036-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..6d91c8fe82fb64b14e31cd7379037bd07e6d788b
--- /dev/null
+++ b/model-00036-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:790ed51498aa9c7bd89cf5a6c992a7e5f1a4c11fbf7442109861dee4ee1da545
+size 3941943536
diff --git a/model-00037-of-00092.safetensors b/model-00037-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..abf366ac4f8ff8c47fe6613254e29757e90f5ee2
--- /dev/null
+++ b/model-00037-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2e6e93031b97c013bd788fc2cc50c0f63e27467d385c2ebe5fac868bfcb702e9
+size 3941943536
diff --git a/model-00038-of-00092.safetensors b/model-00038-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..c7df67c9e1d131193ef82537748e64ddeecf8527
--- /dev/null
+++ b/model-00038-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:36817ddbedc45efa0d1456380efa0da082230e8f17fc4bd9a3371d6483d2a269
+size 3941943536
diff --git a/model-00039-of-00092.safetensors b/model-00039-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..b38b93f6d0210f5b64a2eec7436e724a530895ae
--- /dev/null
+++ b/model-00039-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1c055d384cccbb058ffb1340aa8257dd6fe7dd3e36d6b42ddbdfb376ef913a92
+size 3941943536
diff --git a/model-00040-of-00092.safetensors b/model-00040-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..45ab4b2c5984b98d3f1a81efb7e4b8fb71ff67d0
--- /dev/null
+++ b/model-00040-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0f915a463515c2dc598384977f87fe13c7bbba1472f6805ed8a95ee0db7ba189
+size 3941943536
diff --git a/model-00041-of-00092.safetensors b/model-00041-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..d5ca7d3e6efaf73e0e874a0c0d4761cff412a845
--- /dev/null
+++ b/model-00041-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d3b189147fae2fc8687d7ca6fd8fd18cd0e0c06b4e2503b8e5e756eda9e514c0
+size 3941943536
diff --git a/model-00042-of-00092.safetensors b/model-00042-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..1de06352acdb36079c06b5c8393c70064b8f37f6
--- /dev/null
+++ b/model-00042-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:edbfcb70d09a5e6ad08656fd99eb295a980b7ba620194779f83d6bec4c0bb398
+size 3941943536
diff --git a/model-00043-of-00092.safetensors b/model-00043-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..fb0b5c0afaf3222106b5e00fad1d7767100dcbf6
--- /dev/null
+++ b/model-00043-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6b7ca94fef251671134ac6dba9caff54575cf642559ef9c6d454360b3de8c3a9
+size 3941943536
diff --git a/model-00044-of-00092.safetensors b/model-00044-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..97654a89f72ad432987bae7d19eb69c95c9c0a73
--- /dev/null
+++ b/model-00044-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ee218d7ef8992c0240971a42f34bdeeb8db671150e827987cfb261c29bf31101
+size 3941943536
diff --git a/model-00045-of-00092.safetensors b/model-00045-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..24a1a72fa2a60470bd0a007f069f57d1db694657
--- /dev/null
+++ b/model-00045-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:79d6a523ee12a52e3e7478c1aa0de766e958d86bfab42a31e71ab2437dabe238
+size 3941943536
diff --git a/model-00046-of-00092.safetensors b/model-00046-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..c8671c90fad8f22d5ff3987ac604da399f9b4bf6
--- /dev/null
+++ b/model-00046-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bff3444aa40c5904a1ee7d49d7c16ab6f710f1cfc23b82a1cae3ff4c96cae7ec
+size 3941943536
diff --git a/model-00047-of-00092.safetensors b/model-00047-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..322f08471c39bdd79bcbb2731b636aeaced392ef
--- /dev/null
+++ b/model-00047-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:83b48b4c4efabe707b15f36d1c3111e8b4ae5d4150b1409f3265cf9ae0cc10df
+size 3941943536
diff --git a/model-00048-of-00092.safetensors b/model-00048-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..ceecd1fb606e74911dde25c671df87d82acc8757
--- /dev/null
+++ b/model-00048-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5210b3bddeeffb0ae0324570719c0fa9d86e0925cb9af441325c300b33ee2c21
+size 3941943536
diff --git a/model-00049-of-00092.safetensors b/model-00049-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..970047dffd438ffe494a3f27df4f03f4c7682c96
--- /dev/null
+++ b/model-00049-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6401829e178f6e38e0043c7198a5471f0275ceb117e4979519ada9c9b6b5fd90
+size 3941943536
diff --git a/model-00050-of-00092.safetensors b/model-00050-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..06abc4146c3fa7863d2a3af66bf8ea67e10e4259
--- /dev/null
+++ b/model-00050-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1ad02c1d52d07b8e9cdb446196b1d6e0ad4d9320ce0e714b997675861f6a3204
+size 3941943536
diff --git a/model-00051-of-00092.safetensors b/model-00051-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..85b3a4e60ad7a34757aceb17aa53ba4b3ff0eda1
--- /dev/null
+++ b/model-00051-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:eb77712e3ed83041cdf154b564c03b2749408e987b30616710e19b73895a606d
+size 3941943536
diff --git a/model-00052-of-00092.safetensors b/model-00052-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..8096a476f9df2857ce068e8aea63ce4acb62ee7e
--- /dev/null
+++ b/model-00052-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:76cc02458ec6466703e4c3c5ca111c1f19185c4b431370aa40231fe2274da81e
+size 3941943536
diff --git a/model-00053-of-00092.safetensors b/model-00053-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..1d3f35e5e0392cefce74b60a153891e76a619adb
--- /dev/null
+++ b/model-00053-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d023200f696a4cb10e8a11b6a4017c10cab5ea3b74b4780eabb4a9aa75154e0e
+size 3941943536
diff --git a/model-00054-of-00092.safetensors b/model-00054-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..336f9d4f0bf95554ecf0928ef3eace769970ee7b
--- /dev/null
+++ b/model-00054-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6832598c997fc794e5e28e544e5eb6bf8d2d25df75b8c744261d43b2a3335b49
+size 3941943536
diff --git a/model-00055-of-00092.safetensors b/model-00055-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..b27d5b9d45f6f66837e3e98c79a7578793195dce
--- /dev/null
+++ b/model-00055-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f450bc3bf71585510de4fad9a3b27ff77d339c8788dff86f250e8d470773422c
+size 3941943536
diff --git a/model-00056-of-00092.safetensors b/model-00056-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..b63a86cd9c011d0a6cc303b713fe9ebce1d1d5f8
--- /dev/null
+++ b/model-00056-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c2d150833d052066239cad9016bf95665902879aaf8badaac1435277df5fc0a5
+size 3941943536
diff --git a/model-00057-of-00092.safetensors b/model-00057-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..efe0e5d3f4a016d1e53aef3b040532a514fa5eb5
--- /dev/null
+++ b/model-00057-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9e4f8f4b432a677fd19a782222399acfdb4b77fe7c4217ccea0aee7b09cdb4a7
+size 3941943536
diff --git a/model-00058-of-00092.safetensors b/model-00058-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..a2d7c5b8845fea912c83cfadf671a12d949c0aaf
--- /dev/null
+++ b/model-00058-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cbbcb5209dbc3500d1d8a76cb605e92b179b30fe05477d633200d066950634cd
+size 3941943536
diff --git a/model-00059-of-00092.safetensors b/model-00059-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..ac59c2313104281fe0fb7d4c11652bd15a2f3961
--- /dev/null
+++ b/model-00059-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:94483530501d4921699f31ffd2f008bcae2975ac5b6b378c943daa4a3cf6edef
+size 3941943536
diff --git a/model-00060-of-00092.safetensors b/model-00060-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..6665c235232b506d9c55cdff3abdbf31a351020e
--- /dev/null
+++ b/model-00060-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d2f0ba41b3e09369a27f8e1f811a1455aa7fd9787914289196fb3e973b513a9a
+size 3941943536
diff --git a/model-00061-of-00092.safetensors b/model-00061-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..fe16a8e9d1d5980aa2a03651020fa8699270965d
--- /dev/null
+++ b/model-00061-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3bc1544f7d4098a9ee89cc4e2b2b970e9a44a85ea05cc133a3cbf2a145186646
+size 3941943536
diff --git a/model-00062-of-00092.safetensors b/model-00062-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..69b5fa1d3526c00ccff1309f2e1fe24fd50608fb
--- /dev/null
+++ b/model-00062-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e05d05d7e791eb21af68621624e6f2dbc3bd6ff1858a275278aef87dd3e9b490
+size 3941943536
diff --git a/model-00063-of-00092.safetensors b/model-00063-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..b5c2093e01f957c2784bc21a6c67fbe0428e3fba
--- /dev/null
+++ b/model-00063-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7d4057eda737a92199d74fd80c18b4886f0805ba954ee6e6ed4abb21da19a0dc
+size 3941943536
diff --git a/model-00064-of-00092.safetensors b/model-00064-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..6373cf91d90d39251edb93306e1b268a0e146565
--- /dev/null
+++ b/model-00064-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cf447bb87d72a6e32425bc9818d98cb95b2211dd7bf54a1d2e423753a2179cb2
+size 3941943536
diff --git a/model-00065-of-00092.safetensors b/model-00065-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..41f38645d35de33177dd4428ae2c72ccfa9eb7bf
--- /dev/null
+++ b/model-00065-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:808551308d25597c7d2850f75dc7a8706f22e2581a54cc4e87e01a307bc53553
+size 3941943536
diff --git a/model-00066-of-00092.safetensors b/model-00066-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..689f7a6d9b782b878167de340499166e6ca067d0
--- /dev/null
+++ b/model-00066-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0a9cf9eb8e46f6f63215377b153e078e990c7deaadf7de8c5806befe0ba6eec5
+size 3941943536
diff --git a/model-00067-of-00092.safetensors b/model-00067-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..a168c11d7d22875b4bf4b162ac201daf60fe7075
--- /dev/null
+++ b/model-00067-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:54df94ffda62e97e8c1cbcf43aea6a6dd129ac918fbd3b57705d3dcd3ab018fe
+size 3941943536
diff --git a/model-00068-of-00092.safetensors b/model-00068-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..9357f3a6922107bf69ccceb5c6aa3815ee67611e
--- /dev/null
+++ b/model-00068-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5caefe9ea8c24b4f1f81b83d45cf59b545896a2b320a1ac84e720d8c09c9d30b
+size 3941943536
diff --git a/model-00069-of-00092.safetensors b/model-00069-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..f67abc654f50ed34314fe7ae3d2bce3edba7810a
--- /dev/null
+++ b/model-00069-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cab8e5b71bd3e540daf2f44bc7e70c81d5c225ee1c6814270f1afc6948272ece
+size 3941943536
diff --git a/model-00070-of-00092.safetensors b/model-00070-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..2f7eb587487dd1b115fdfdb78792341445c7361a
--- /dev/null
+++ b/model-00070-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:94235934eeb095493aa324ae10b36449aa3c9f791fe54696fd8de97b29b2c0db
+size 3941943536
diff --git a/model-00071-of-00092.safetensors b/model-00071-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..699c2db98ae1c1d73b2b9aec92eac9ff01294f9a
--- /dev/null
+++ b/model-00071-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:09e22042d1f6533d89e5ed983c7b71ceccbdfff0902a8d159a42128e987670e4
+size 3941943536
diff --git a/model-00072-of-00092.safetensors b/model-00072-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..82e245325bd6f5421d5bf7e6c01ecbc678c7f8ca
--- /dev/null
+++ b/model-00072-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1d18ac7900d087701c4ba6effc4fa21f2ebfdad8b77bf4bad193b6af847d65b2
+size 3941943536
diff --git a/model-00073-of-00092.safetensors b/model-00073-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..26f07ee68865ee22150d1a14327e186e7de9e175
--- /dev/null
+++ b/model-00073-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ab0f07f3b9be9055353d9da3e6a85090fe5e6f07520e42952f4dbd5fd05e1635
+size 3941943536
diff --git a/model-00074-of-00092.safetensors b/model-00074-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..7ab7dedd53bd223c855d642c80d0d05da49e7e6f
--- /dev/null
+++ b/model-00074-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:12c80895305ebef1fe35af62f690850e07c8295fb848092209c54b4799fdd606
+size 3941943536
diff --git a/model-00075-of-00092.safetensors b/model-00075-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..577efa9688e4cb8ca912273e87115bca75fe518c
--- /dev/null
+++ b/model-00075-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e909f89ffc6dcc70a4b052f2f366cdc9a776874b875e75a018bd5acc671b39cd
+size 3941943536
diff --git a/model-00076-of-00092.safetensors b/model-00076-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..410e06a7450ed94933f590b1232c6c83fbb03d9d
--- /dev/null
+++ b/model-00076-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f2b5ea7d814154904df842d3cd845076ba6579f82ea14b7b5c090818a72a1ec9
+size 3941943536
diff --git a/model-00077-of-00092.safetensors b/model-00077-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..74a83472701c6dcf6455f9af60d026c279e2e197
--- /dev/null
+++ b/model-00077-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6264ae4c51303e0a0763f165df4d9fee10b2b4555ab291e5b276a49ece3b18e3
+size 3941943536
diff --git a/model-00078-of-00092.safetensors b/model-00078-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..9224fdf20dacca6eec3931633e59550fba310b5f
--- /dev/null
+++ b/model-00078-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:159e50c9ff99069cb792547db064ba71f03d542c8626ecebb10b990570800bc4
+size 3941943536
diff --git a/model-00079-of-00092.safetensors b/model-00079-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..43a4623ab8a1615328150c18db541117266462e1
--- /dev/null
+++ b/model-00079-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4163812bee41fd9699cbe2fe05f0ba8032f3d48a09a3b4000bd372b7496f64fb
+size 3941943536
diff --git a/model-00080-of-00092.safetensors b/model-00080-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..97b500903c18c0d6a24406c1c52bd84247783fa5
--- /dev/null
+++ b/model-00080-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:77c2f9e2198290a083a595fec2ab521d357bf2886f0ac10c7f0a4130cc30ef7d
+size 3941943536
diff --git a/model-00081-of-00092.safetensors b/model-00081-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..834734dde90432690daf1d9521424ac1a0ea3811
--- /dev/null
+++ b/model-00081-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:69f1fbed934759564fc5c934cc53ceee37a70fa7eec13bf17ceef2afdf244666
+size 3941943536
diff --git a/model-00082-of-00092.safetensors b/model-00082-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..884dcc63832de4cd7859736ee337b64ae84175b2
--- /dev/null
+++ b/model-00082-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:89048d2be89e98d54a15ea59e637b40e10b5d82c57a8752add179f8bec1f76f2
+size 3941943536
diff --git a/model-00083-of-00092.safetensors b/model-00083-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..7cb9663df760fc65d6d786fbfc845e05c9df8c34
--- /dev/null
+++ b/model-00083-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:adcd2d283a7264aee6e7ff286afc487179325d20f408104a78624b0489fcc97a
+size 3941943536
diff --git a/model-00084-of-00092.safetensors b/model-00084-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..29935221c8889e7e4ad44496c1bb2940e938cee0
--- /dev/null
+++ b/model-00084-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:68870660b2938451eef7e1abaa8a3005d98ecc2f8c5ec46e222d81109b5d375d
+size 3941943536
diff --git a/model-00085-of-00092.safetensors b/model-00085-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..6c5d63d50bc4ecaf121ad406c2cdd30d2f9ab746
--- /dev/null
+++ b/model-00085-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:991ad9e61d555831e56a7f4b3a6099b0e043fcc48933c3b6e806862c1f4c086c
+size 3941943536
diff --git a/model-00086-of-00092.safetensors b/model-00086-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..5ae14410927872243b2204d5aafaf867059fa2b5
--- /dev/null
+++ b/model-00086-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3ea419160c41c7d3e598eaccbf27f6c275c7af9d74abb63f695d7e82ae44a3ea
+size 3941943536
diff --git a/model-00087-of-00092.safetensors b/model-00087-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..7eebfea5dcc1a08b135973e4e44ea4c68f2f60a3
--- /dev/null
+++ b/model-00087-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:be730c6eebce8fa762b2522cfbb1f5dbc1f14f6e4634097519e1b0f5dde212e5
+size 3941943536
diff --git a/model-00088-of-00092.safetensors b/model-00088-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..fa4c9a6aad8221bd4b1e3ab1d4dc895a397cf6ff
--- /dev/null
+++ b/model-00088-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cf49764e5a379ae8f00762a710a159eddf830e1bf8d31357ea4dbe7d8a872555
+size 3941943536
diff --git a/model-00089-of-00092.safetensors b/model-00089-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..28ff1698875a82335f81f9a567c39145723f4960
--- /dev/null
+++ b/model-00089-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3e0ee2961ff627ee59e4018a962c031d0a599cc4053f7a7b5c35db9d5c3b243a
+size 3941943536
diff --git a/model-00090-of-00092.safetensors b/model-00090-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..55be17c0144023b6dc99affda8b870dd48702fbb
--- /dev/null
+++ b/model-00090-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f0c5a39ff0b581d28218d231ff97ea957888ab93076f647c35904e4d6e77dd99
+size 3941943536
diff --git a/model-00091-of-00092.safetensors b/model-00091-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..c0d72539f03be388e9261fd33747cbe90c46135b
--- /dev/null
+++ b/model-00091-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8d61b99736f291083d612fa9dc4f7fc0a8790e56140addbe2c30d40d2829c284
+size 3941943536
diff --git a/model-00092-of-00092.safetensors b/model-00092-of-00092.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..5ff936620feec4f8689fd122f7569e8518c3861d
--- /dev/null
+++ b/model-00092-of-00092.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:df37ea56e9ee14e90db23365cd7ffa6ff202a7668df66ad2eba1fb3022a632fc
+size 5493846760
diff --git a/model.safetensors.index.json b/model.safetensors.index.json
new file mode 100644
index 0000000000000000000000000000000000000000..26636eb07cf84de1ee1f7e05714e660b83d8ba91
--- /dev/null
+++ b/model.safetensors.index.json
@@ -0,0 +1,88060 @@
+{
+ "metadata": {
+ "total_size": 241145664
+ },
+ "weight_map": {
+ "lm_head.weight": "model-00092-of-00092.safetensors",
+ "model.embed_tokens.weight": "model-00001-of-00092.safetensors",
+ "model.layers.0.input_layernorm.weight": "model-00001-of-00092.safetensors",
+ "model.layers.0.mlp.down_proj.weight": "model-00001-of-00092.safetensors",
+ "model.layers.0.mlp.down_proj.weight_scale": "model-00001-of-00092.safetensors",
+ "model.layers.0.mlp.gate_proj.weight": "model-00001-of-00092.safetensors",
+ "model.layers.0.mlp.gate_proj.weight_scale": "model-00001-of-00092.safetensors",
+ "model.layers.0.mlp.up_proj.weight": "model-00001-of-00092.safetensors",
+ "model.layers.0.mlp.up_proj.weight_scale": "model-00001-of-00092.safetensors",
+ "model.layers.0.post_attention_layernorm.weight": "model-00001-of-00092.safetensors",
+ "model.layers.0.self_attn.k_norm.weight": "model-00001-of-00092.safetensors",
+ "model.layers.0.self_attn.k_proj.bias": "model-00001-of-00092.safetensors",
+ "model.layers.0.self_attn.k_proj.weight": "model-00001-of-00092.safetensors",
+ "model.layers.0.self_attn.k_proj.weight_scale": "model-00001-of-00092.safetensors",
+ "model.layers.0.self_attn.o_proj.weight": "model-00001-of-00092.safetensors",
+ "model.layers.0.self_attn.o_proj.weight_scale": "model-00001-of-00092.safetensors",
+ "model.layers.0.self_attn.q_norm.weight": "model-00001-of-00092.safetensors",
+ "model.layers.0.self_attn.q_proj.bias": "model-00001-of-00092.safetensors",
+ "model.layers.0.self_attn.q_proj.weight": "model-00001-of-00092.safetensors",
+ "model.layers.0.self_attn.q_proj.weight_scale": "model-00001-of-00092.safetensors",
+ "model.layers.0.self_attn.v_proj.bias": "model-00001-of-00092.safetensors",
+ "model.layers.0.self_attn.v_proj.weight": "model-00001-of-00092.safetensors",
+ "model.layers.0.self_attn.v_proj.weight_scale": "model-00001-of-00092.safetensors",
+ "model.layers.1.input_layernorm.weight": "model-00002-of-00092.safetensors",
+ "model.layers.1.mlp.down_proj.weight": "model-00002-of-00092.safetensors",
+ "model.layers.1.mlp.down_proj.weight_scale": "model-00002-of-00092.safetensors",
+ "model.layers.1.mlp.gate_proj.weight": "model-00002-of-00092.safetensors",
+ "model.layers.1.mlp.gate_proj.weight_scale": "model-00002-of-00092.safetensors",
+ "model.layers.1.mlp.up_proj.weight": "model-00002-of-00092.safetensors",
+ "model.layers.1.mlp.up_proj.weight_scale": "model-00002-of-00092.safetensors",
+ "model.layers.1.post_attention_layernorm.weight": "model-00002-of-00092.safetensors",
+ "model.layers.1.self_attn.k_norm.weight": "model-00002-of-00092.safetensors",
+ "model.layers.1.self_attn.k_proj.bias": "model-00002-of-00092.safetensors",
+ "model.layers.1.self_attn.k_proj.weight": "model-00002-of-00092.safetensors",
+ "model.layers.1.self_attn.k_proj.weight_scale": "model-00002-of-00092.safetensors",
+ "model.layers.1.self_attn.o_proj.weight": "model-00002-of-00092.safetensors",
+ "model.layers.1.self_attn.o_proj.weight_scale": "model-00002-of-00092.safetensors",
+ "model.layers.1.self_attn.q_norm.weight": "model-00002-of-00092.safetensors",
+ "model.layers.1.self_attn.q_proj.bias": "model-00002-of-00092.safetensors",
+ "model.layers.1.self_attn.q_proj.weight": "model-00002-of-00092.safetensors",
+ "model.layers.1.self_attn.q_proj.weight_scale": "model-00002-of-00092.safetensors",
+ "model.layers.1.self_attn.v_proj.bias": "model-00002-of-00092.safetensors",
+ "model.layers.1.self_attn.v_proj.weight": "model-00002-of-00092.safetensors",
+ "model.layers.1.self_attn.v_proj.weight_scale": "model-00002-of-00092.safetensors",
+ "model.layers.10.input_layernorm.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.0.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.0.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.0.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.0.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.0.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.0.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.1.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.1.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.1.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.1.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.1.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.1.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.10.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.10.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.10.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.10.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.10.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.10.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.100.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.100.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.100.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.100.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.100.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.100.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.101.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.101.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.101.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.101.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.101.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.101.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.102.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.102.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.102.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.102.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.102.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.102.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.103.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.103.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.103.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.103.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.103.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.103.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.104.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.104.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.104.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.104.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.104.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.104.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.105.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.105.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.105.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.105.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.105.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.105.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.106.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.106.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.106.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.106.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.106.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.106.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.107.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.107.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.107.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.107.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.107.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.107.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.108.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.108.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.108.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.108.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.108.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.108.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.109.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.109.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.109.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.109.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.109.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.109.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.11.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.11.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.11.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.11.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.11.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.11.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.110.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.110.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.110.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.110.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.110.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.110.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.111.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.111.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.111.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.111.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.111.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.111.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.112.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.112.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.112.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.112.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.112.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.112.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.113.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.113.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.113.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.113.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.113.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.113.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.114.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.114.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.114.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.114.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.114.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.114.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.115.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.115.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.115.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.115.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.115.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.115.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.116.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.116.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.116.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.116.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.116.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.116.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.117.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.117.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.117.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.117.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.117.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.117.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.118.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.118.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.118.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.118.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.118.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.118.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.119.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.119.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.119.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.119.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.119.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.119.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.12.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.12.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.12.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.12.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.12.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.12.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.120.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.120.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.120.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.120.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.120.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.120.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.121.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.121.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.121.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.121.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.121.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.121.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.122.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.122.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.122.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.122.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.122.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.122.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.123.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.123.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.123.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.123.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.123.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.123.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.124.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.124.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.124.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.124.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.124.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.124.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.125.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.125.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.125.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.125.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.125.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.125.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.126.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.126.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.126.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.126.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.126.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.126.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.127.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.127.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.127.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.127.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.127.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.127.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.128.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.128.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.128.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.128.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.128.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.128.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.129.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.129.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.129.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.129.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.129.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.129.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.13.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.13.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.13.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.13.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.13.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.13.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.130.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.130.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.130.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.130.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.130.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.130.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.131.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.131.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.131.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.131.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.131.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.131.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.132.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.132.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.132.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.132.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.132.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.132.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.133.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.133.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.133.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.133.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.133.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.133.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.134.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.134.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.134.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.134.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.134.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.134.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.135.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.135.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.135.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.135.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.135.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.135.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.136.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.136.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.136.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.136.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.136.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.136.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.137.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.137.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.137.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.137.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.137.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.137.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.138.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.138.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.138.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.138.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.138.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.138.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.139.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.139.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.139.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.139.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.139.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.139.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.14.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.14.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.14.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.14.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.14.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.14.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.140.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.140.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.140.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.140.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.140.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.140.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.141.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.141.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.141.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.141.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.141.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.141.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.142.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.142.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.142.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.142.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.142.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.142.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.143.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.143.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.143.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.143.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.143.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.143.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.144.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.144.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.144.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.144.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.144.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.144.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.145.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.145.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.145.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.145.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.145.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.145.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.146.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.146.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.146.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.146.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.146.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.146.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.147.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.147.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.147.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.147.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.147.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.147.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.148.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.148.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.148.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.148.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.148.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.148.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.149.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.149.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.149.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.149.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.149.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.149.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.15.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.15.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.15.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.15.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.15.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.15.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.150.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.150.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.150.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.150.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.150.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.150.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.151.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.151.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.151.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.151.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.151.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.151.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.152.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.152.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.152.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.152.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.152.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.152.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.153.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.153.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.153.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.153.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.153.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.153.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.154.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.154.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.154.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.154.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.154.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.154.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.155.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.155.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.155.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.155.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.155.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.155.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.156.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.156.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.156.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.156.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.156.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.156.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.157.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.157.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.157.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.157.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.157.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.157.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.158.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.158.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.158.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.158.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.158.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.158.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.159.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.159.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.159.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.159.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.159.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.159.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.16.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.16.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.16.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.16.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.16.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.16.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.17.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.17.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.17.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.17.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.17.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.17.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.18.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.18.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.18.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.18.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.18.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.18.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.19.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.19.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.19.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.19.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.19.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.19.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.2.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.2.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.2.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.2.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.2.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.2.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.20.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.20.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.20.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.20.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.20.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.20.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.21.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.21.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.21.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.21.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.21.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.21.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.22.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.22.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.22.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.22.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.22.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.22.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.23.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.23.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.23.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.23.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.23.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.23.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.24.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.24.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.24.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.24.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.24.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.24.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.25.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.25.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.25.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.25.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.25.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.25.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.26.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.26.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.26.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.26.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.26.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.26.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.27.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.27.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.27.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.27.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.27.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.27.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.28.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.28.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.28.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.28.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.28.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.28.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.29.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.29.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.29.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.29.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.29.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.29.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.3.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.3.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.3.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.3.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.3.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.3.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.30.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.30.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.30.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.30.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.30.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.30.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.31.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.31.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.31.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.31.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.31.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.31.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.32.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.32.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.32.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.32.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.32.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.32.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.33.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.33.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.33.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.33.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.33.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.33.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.34.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.34.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.34.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.34.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.34.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.34.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.35.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.35.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.35.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.35.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.35.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.35.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.36.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.36.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.36.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.36.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.36.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.36.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.37.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.37.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.37.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.37.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.37.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.37.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.38.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.38.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.38.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.38.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.38.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.38.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.39.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.39.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.39.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.39.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.39.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.39.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.4.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.4.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.4.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.4.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.4.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.4.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.40.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.40.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.40.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.40.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.40.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.40.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.41.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.41.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.41.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.41.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.41.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.41.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.42.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.42.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.42.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.42.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.42.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.42.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.43.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.43.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.43.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.43.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.43.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.43.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.44.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.44.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.44.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.44.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.44.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.44.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.45.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.45.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.45.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.45.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.45.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.45.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.46.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.46.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.46.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.46.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.46.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.46.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.47.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.47.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.47.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.47.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.47.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.47.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.48.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.48.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.48.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.48.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.48.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.48.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.49.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.49.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.49.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.49.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.49.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.49.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.5.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.5.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.5.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.5.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.5.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.5.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.50.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.50.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.50.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.50.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.50.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.50.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.51.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.51.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.51.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.51.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.51.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.51.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.52.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.52.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.52.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.52.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.52.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.52.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.53.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.53.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.53.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.53.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.53.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.53.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.54.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.54.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.54.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.54.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.54.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.54.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.55.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.55.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.55.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.55.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.55.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.55.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.56.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.56.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.56.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.56.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.56.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.56.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.57.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.57.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.57.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.57.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.57.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.57.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.58.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.58.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.58.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.58.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.58.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.58.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.59.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.59.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.59.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.59.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.59.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.59.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.6.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.6.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.6.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.6.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.6.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.6.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.60.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.60.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.60.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.60.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.60.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.60.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.61.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.61.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.61.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.61.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.61.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.61.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.62.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.62.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.62.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.62.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.62.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.62.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.63.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.63.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.63.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.63.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.63.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.63.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.64.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.64.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.64.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.64.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.64.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.64.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.65.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.65.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.65.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.65.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.65.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.65.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.66.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.66.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.66.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.66.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.66.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.66.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.67.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.67.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.67.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.67.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.67.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.67.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.68.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.68.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.68.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.68.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.68.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.68.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.69.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.69.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.69.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.69.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.69.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.69.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.7.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.7.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.7.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.7.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.7.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.7.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.70.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.70.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.70.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.70.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.70.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.70.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.71.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.71.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.71.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.71.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.71.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.71.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.72.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.72.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.72.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.72.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.72.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.72.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.73.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.73.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.73.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.73.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.73.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.73.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.74.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.74.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.74.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.74.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.74.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.74.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.75.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.75.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.75.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.75.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.75.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.75.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.76.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.76.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.76.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.76.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.76.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.76.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.77.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.77.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.77.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.77.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.77.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.77.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.78.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.78.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.78.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.78.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.78.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.78.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.79.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.79.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.79.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.79.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.79.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.79.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.8.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.8.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.8.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.8.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.8.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.8.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.80.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.80.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.80.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.80.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.80.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.80.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.81.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.81.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.81.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.81.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.81.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.81.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.82.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.82.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.82.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.82.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.82.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.82.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.83.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.83.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.83.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.83.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.83.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.83.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.84.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.84.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.84.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.84.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.84.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.84.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.85.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.85.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.85.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.85.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.85.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.85.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.86.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.86.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.86.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.86.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.86.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.86.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.87.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.87.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.87.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.87.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.87.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.87.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.88.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.88.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.88.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.88.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.88.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.88.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.89.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.89.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.89.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.89.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.89.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.89.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.9.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.9.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.9.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.9.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.9.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.9.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.90.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.90.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.90.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.90.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.90.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.90.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.91.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.91.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.91.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.91.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.91.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.91.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.92.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.92.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.92.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.92.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.92.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.92.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.93.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.93.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.93.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.93.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.93.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.93.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.94.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.94.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.94.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.94.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.94.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.94.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.95.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.95.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.95.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.95.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.95.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.95.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.96.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.96.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.96.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.96.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.96.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.96.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.97.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.97.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.97.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.97.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.97.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.97.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.98.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.98.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.98.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.98.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.98.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.98.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.99.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.99.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.99.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.99.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.99.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.experts.99.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.gate.e_score_correction_bias": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.gate.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.shared_experts.down_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.shared_experts.down_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.shared_experts.gate_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.shared_experts.gate_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.shared_experts.up_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.mlp.shared_experts.up_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.post_attention_layernorm.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.self_attn.k_norm.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.self_attn.k_proj.bias": "model-00011-of-00092.safetensors",
+ "model.layers.10.self_attn.k_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.self_attn.k_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.self_attn.o_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.self_attn.o_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.self_attn.q_norm.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.self_attn.q_proj.bias": "model-00011-of-00092.safetensors",
+ "model.layers.10.self_attn.q_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.self_attn.q_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.10.self_attn.v_proj.bias": "model-00011-of-00092.safetensors",
+ "model.layers.10.self_attn.v_proj.weight": "model-00011-of-00092.safetensors",
+ "model.layers.10.self_attn.v_proj.weight_scale": "model-00011-of-00092.safetensors",
+ "model.layers.11.input_layernorm.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.0.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.0.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.0.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.0.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.0.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.0.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.1.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.1.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.1.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.1.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.1.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.1.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.10.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.10.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.10.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.10.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.10.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.10.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.100.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.100.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.100.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.100.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.100.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.100.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.101.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.101.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.101.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.101.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.101.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.101.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.102.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.102.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.102.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.102.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.102.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.102.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.103.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.103.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.103.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.103.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.103.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.103.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.104.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.104.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.104.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.104.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.104.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.104.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.105.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.105.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.105.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.105.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.105.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.105.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.106.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.106.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.106.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.106.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.106.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.106.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.107.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.107.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.107.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.107.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.107.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.107.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.108.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.108.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.108.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.108.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.108.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.108.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.109.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.109.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.109.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.109.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.109.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.109.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.11.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.11.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.11.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.11.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.11.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.11.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.110.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.110.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.110.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.110.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.110.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.110.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.111.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.111.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.111.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.111.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.111.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.111.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.112.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.112.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.112.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.112.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.112.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.112.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.113.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.113.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.113.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.113.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.113.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.113.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.114.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.114.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.114.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.114.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.114.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.114.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.115.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.115.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.115.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.115.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.115.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.115.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.116.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.116.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.116.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.116.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.116.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.116.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.117.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.117.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.117.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.117.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.117.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.117.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.118.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.118.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.118.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.118.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.118.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.118.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.119.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.119.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.119.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.119.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.119.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.119.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.12.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.12.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.12.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.12.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.12.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.12.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.120.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.120.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.120.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.120.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.120.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.120.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.121.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.121.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.121.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.121.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.121.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.121.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.122.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.122.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.122.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.122.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.122.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.122.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.123.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.123.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.123.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.123.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.123.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.123.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.124.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.124.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.124.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.124.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.124.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.124.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.125.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.125.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.125.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.125.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.125.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.125.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.126.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.126.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.126.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.126.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.126.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.126.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.127.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.127.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.127.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.127.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.127.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.127.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.128.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.128.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.128.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.128.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.128.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.128.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.129.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.129.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.129.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.129.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.129.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.129.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.13.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.13.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.13.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.13.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.13.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.13.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.130.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.130.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.130.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.130.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.130.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.130.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.131.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.131.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.131.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.131.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.131.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.131.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.132.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.132.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.132.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.132.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.132.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.132.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.133.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.133.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.133.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.133.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.133.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.133.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.134.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.134.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.134.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.134.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.134.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.134.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.135.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.135.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.135.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.135.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.135.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.135.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.136.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.136.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.136.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.136.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.136.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.136.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.137.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.137.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.137.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.137.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.137.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.137.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.138.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.138.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.138.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.138.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.138.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.138.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.139.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.139.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.139.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.139.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.139.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.139.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.14.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.14.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.14.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.14.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.14.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.14.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.140.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.140.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.140.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.140.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.140.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.140.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.141.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.141.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.141.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.141.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.141.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.141.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.142.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.142.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.142.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.142.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.142.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.142.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.143.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.143.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.143.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.143.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.143.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.143.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.144.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.144.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.144.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.144.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.144.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.144.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.145.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.145.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.145.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.145.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.145.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.145.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.146.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.146.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.146.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.146.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.146.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.146.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.147.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.147.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.147.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.147.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.147.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.147.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.148.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.148.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.148.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.148.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.148.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.148.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.149.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.149.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.149.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.149.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.149.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.149.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.15.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.15.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.15.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.15.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.15.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.15.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.150.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.150.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.150.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.150.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.150.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.150.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.151.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.151.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.151.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.151.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.151.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.151.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.152.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.152.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.152.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.152.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.152.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.152.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.153.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.153.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.153.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.153.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.153.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.153.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.154.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.154.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.154.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.154.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.154.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.154.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.155.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.155.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.155.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.155.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.155.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.155.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.156.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.156.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.156.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.156.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.156.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.156.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.157.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.157.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.157.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.157.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.157.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.157.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.158.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.158.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.158.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.158.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.158.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.158.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.159.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.159.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.159.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.159.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.159.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.159.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.16.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.16.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.16.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.16.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.16.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.16.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.17.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.17.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.17.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.17.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.17.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.17.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.18.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.18.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.18.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.18.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.18.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.18.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.19.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.19.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.19.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.19.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.19.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.19.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.2.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.2.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.2.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.2.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.2.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.2.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.20.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.20.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.20.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.20.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.20.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.20.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.21.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.21.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.21.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.21.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.21.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.21.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.22.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.22.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.22.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.22.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.22.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.22.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.23.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.23.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.23.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.23.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.23.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.23.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.24.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.24.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.24.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.24.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.24.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.24.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.25.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.25.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.25.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.25.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.25.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.25.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.26.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.26.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.26.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.26.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.26.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.26.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.27.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.27.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.27.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.27.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.27.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.27.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.28.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.28.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.28.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.28.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.28.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.28.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.29.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.29.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.29.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.29.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.29.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.29.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.3.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.3.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.3.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.3.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.3.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.3.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.30.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.30.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.30.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.30.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.30.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.30.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.31.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.31.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.31.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.31.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.31.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.31.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.32.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.32.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.32.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.32.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.32.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.32.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.33.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.33.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.33.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.33.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.33.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.33.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.34.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.34.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.34.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.34.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.34.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.34.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.35.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.35.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.35.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.35.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.35.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.35.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.36.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.36.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.36.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.36.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.36.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.36.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.37.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.37.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.37.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.37.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.37.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.37.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.38.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.38.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.38.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.38.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.38.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.38.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.39.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.39.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.39.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.39.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.39.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.39.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.4.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.4.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.4.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.4.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.4.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.4.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.40.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.40.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.40.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.40.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.40.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.40.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.41.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.41.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.41.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.41.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.41.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.41.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.42.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.42.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.42.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.42.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.42.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.42.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.43.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.43.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.43.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.43.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.43.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.43.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.44.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.44.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.44.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.44.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.44.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.44.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.45.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.45.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.45.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.45.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.45.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.45.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.46.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.46.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.46.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.46.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.46.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.46.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.47.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.47.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.47.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.47.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.47.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.47.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.48.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.48.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.48.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.48.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.48.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.48.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.49.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.49.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.49.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.49.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.49.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.49.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.5.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.5.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.5.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.5.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.5.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.5.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.50.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.50.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.50.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.50.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.50.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.50.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.51.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.51.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.51.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.51.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.51.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.51.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.52.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.52.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.52.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.52.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.52.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.52.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.53.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.53.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.53.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.53.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.53.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.53.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.54.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.54.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.54.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.54.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.54.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.54.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.55.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.55.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.55.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.55.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.55.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.55.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.56.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.56.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.56.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.56.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.56.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.56.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.57.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.57.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.57.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.57.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.57.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.57.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.58.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.58.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.58.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.58.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.58.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.58.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.59.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.59.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.59.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.59.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.59.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.59.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.6.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.6.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.6.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.6.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.6.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.6.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.60.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.60.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.60.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.60.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.60.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.60.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.61.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.61.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.61.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.61.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.61.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.61.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.62.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.62.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.62.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.62.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.62.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.62.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.63.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.63.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.63.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.63.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.63.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.63.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.64.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.64.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.64.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.64.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.64.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.64.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.65.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.65.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.65.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.65.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.65.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.65.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.66.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.66.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.66.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.66.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.66.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.66.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.67.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.67.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.67.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.67.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.67.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.67.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.68.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.68.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.68.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.68.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.68.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.68.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.69.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.69.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.69.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.69.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.69.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.69.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.7.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.7.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.7.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.7.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.7.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.7.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.70.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.70.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.70.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.70.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.70.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.70.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.71.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.71.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.71.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.71.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.71.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.71.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.72.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.72.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.72.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.72.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.72.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.72.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.73.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.73.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.73.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.73.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.73.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.73.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.74.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.74.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.74.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.74.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.74.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.74.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.75.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.75.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.75.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.75.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.75.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.75.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.76.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.76.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.76.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.76.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.76.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.76.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.77.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.77.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.77.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.77.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.77.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.77.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.78.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.78.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.78.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.78.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.78.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.78.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.79.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.79.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.79.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.79.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.79.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.79.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.8.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.8.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.8.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.8.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.8.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.8.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.80.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.80.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.80.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.80.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.80.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.80.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.81.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.81.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.81.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.81.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.81.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.81.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.82.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.82.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.82.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.82.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.82.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.82.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.83.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.83.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.83.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.83.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.83.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.83.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.84.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.84.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.84.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.84.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.84.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.84.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.85.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.85.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.85.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.85.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.85.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.85.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.86.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.86.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.86.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.86.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.86.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.86.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.87.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.87.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.87.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.87.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.87.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.87.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.88.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.88.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.88.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.88.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.88.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.88.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.89.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.89.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.89.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.89.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.89.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.89.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.9.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.9.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.9.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.9.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.9.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.9.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.90.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.90.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.90.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.90.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.90.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.90.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.91.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.91.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.91.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.91.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.91.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.91.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.92.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.92.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.92.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.92.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.92.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.92.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.93.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.93.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.93.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.93.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.93.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.93.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.94.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.94.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.94.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.94.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.94.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.94.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.95.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.95.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.95.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.95.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.95.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.95.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.96.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.96.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.96.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.96.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.96.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.96.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.97.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.97.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.97.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.97.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.97.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.97.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.98.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.98.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.98.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.98.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.98.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.98.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.99.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.99.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.99.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.99.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.99.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.experts.99.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.gate.e_score_correction_bias": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.gate.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.shared_experts.down_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.shared_experts.down_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.shared_experts.gate_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.shared_experts.gate_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.shared_experts.up_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.mlp.shared_experts.up_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.post_attention_layernorm.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.self_attn.k_norm.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.self_attn.k_proj.bias": "model-00012-of-00092.safetensors",
+ "model.layers.11.self_attn.k_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.self_attn.k_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.self_attn.o_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.self_attn.o_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.self_attn.q_norm.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.self_attn.q_proj.bias": "model-00012-of-00092.safetensors",
+ "model.layers.11.self_attn.q_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.self_attn.q_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.11.self_attn.v_proj.bias": "model-00012-of-00092.safetensors",
+ "model.layers.11.self_attn.v_proj.weight": "model-00012-of-00092.safetensors",
+ "model.layers.11.self_attn.v_proj.weight_scale": "model-00012-of-00092.safetensors",
+ "model.layers.12.input_layernorm.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.0.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.0.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.0.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.0.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.0.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.0.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.1.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.1.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.1.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.1.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.1.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.1.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.10.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.10.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.10.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.10.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.10.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.10.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.100.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.100.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.100.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.100.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.100.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.100.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.101.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.101.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.101.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.101.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.101.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.101.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.102.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.102.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.102.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.102.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.102.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.102.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.103.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.103.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.103.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.103.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.103.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.103.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.104.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.104.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.104.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.104.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.104.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.104.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.105.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.105.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.105.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.105.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.105.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.105.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.106.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.106.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.106.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.106.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.106.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.106.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.107.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.107.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.107.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.107.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.107.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.107.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.108.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.108.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.108.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.108.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.108.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.108.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.109.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.109.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.109.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.109.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.109.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.109.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.11.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.11.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.11.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.11.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.11.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.11.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.110.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.110.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.110.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.110.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.110.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.110.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.111.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.111.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.111.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.111.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.111.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.111.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.112.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.112.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.112.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.112.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.112.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.112.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.113.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.113.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.113.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.113.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.113.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.113.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.114.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.114.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.114.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.114.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.114.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.114.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.115.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.115.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.115.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.115.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.115.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.115.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.116.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.116.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.116.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.116.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.116.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.116.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.117.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.117.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.117.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.117.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.117.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.117.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.118.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.118.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.118.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.118.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.118.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.118.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.119.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.119.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.119.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.119.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.119.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.119.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.12.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.12.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.12.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.12.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.12.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.12.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.120.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.120.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.120.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.120.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.120.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.120.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.121.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.121.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.121.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.121.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.121.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.121.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.122.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.122.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.122.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.122.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.122.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.122.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.123.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.123.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.123.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.123.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.123.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.123.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.124.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.124.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.124.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.124.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.124.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.124.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.125.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.125.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.125.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.125.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.125.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.125.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.126.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.126.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.126.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.126.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.126.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.126.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.127.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.127.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.127.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.127.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.127.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.127.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.128.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.128.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.128.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.128.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.128.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.128.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.129.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.129.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.129.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.129.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.129.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.129.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.13.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.13.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.13.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.13.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.13.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.13.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.130.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.130.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.130.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.130.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.130.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.130.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.131.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.131.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.131.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.131.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.131.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.131.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.132.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.132.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.132.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.132.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.132.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.132.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.133.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.133.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.133.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.133.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.133.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.133.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.134.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.134.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.134.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.134.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.134.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.134.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.135.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.135.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.135.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.135.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.135.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.135.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.136.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.136.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.136.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.136.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.136.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.136.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.137.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.137.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.137.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.137.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.137.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.137.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.138.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.138.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.138.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.138.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.138.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.138.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.139.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.139.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.139.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.139.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.139.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.139.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.14.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.14.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.14.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.14.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.14.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.14.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.140.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.140.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.140.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.140.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.140.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.140.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.141.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.141.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.141.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.141.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.141.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.141.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.142.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.142.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.142.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.142.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.142.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.142.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.143.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.143.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.143.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.143.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.143.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.143.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.144.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.144.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.144.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.144.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.144.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.144.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.145.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.145.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.145.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.145.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.145.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.145.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.146.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.146.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.146.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.146.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.146.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.146.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.147.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.147.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.147.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.147.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.147.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.147.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.148.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.148.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.148.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.148.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.148.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.148.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.149.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.149.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.149.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.149.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.149.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.149.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.15.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.15.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.15.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.15.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.15.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.15.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.150.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.150.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.150.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.150.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.150.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.150.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.151.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.151.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.151.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.151.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.151.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.151.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.152.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.152.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.152.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.152.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.152.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.152.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.153.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.153.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.153.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.153.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.153.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.153.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.154.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.154.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.154.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.154.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.154.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.154.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.155.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.155.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.155.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.155.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.155.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.155.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.156.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.156.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.156.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.156.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.156.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.156.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.157.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.157.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.157.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.157.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.157.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.157.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.158.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.158.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.158.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.158.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.158.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.158.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.159.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.159.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.159.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.159.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.159.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.159.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.16.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.16.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.16.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.16.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.16.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.16.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.17.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.17.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.17.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.17.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.17.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.17.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.18.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.18.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.18.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.18.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.18.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.18.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.19.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.19.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.19.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.19.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.19.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.19.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.2.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.2.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.2.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.2.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.2.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.2.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.20.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.20.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.20.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.20.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.20.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.20.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.21.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.21.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.21.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.21.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.21.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.21.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.22.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.22.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.22.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.22.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.22.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.22.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.23.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.23.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.23.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.23.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.23.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.23.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.24.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.24.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.24.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.24.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.24.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.24.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.25.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.25.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.25.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.25.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.25.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.25.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.26.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.26.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.26.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.26.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.26.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.26.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.27.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.27.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.27.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.27.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.27.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.27.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.28.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.28.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.28.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.28.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.28.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.28.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.29.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.29.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.29.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.29.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.29.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.29.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.3.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.3.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.3.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.3.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.3.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.3.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.30.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.30.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.30.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.30.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.30.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.30.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.31.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.31.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.31.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.31.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.31.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.31.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.32.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.32.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.32.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.32.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.32.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.32.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.33.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.33.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.33.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.33.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.33.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.33.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.34.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.34.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.34.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.34.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.34.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.34.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.35.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.35.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.35.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.35.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.35.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.35.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.36.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.36.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.36.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.36.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.36.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.36.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.37.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.37.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.37.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.37.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.37.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.37.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.38.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.38.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.38.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.38.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.38.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.38.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.39.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.39.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.39.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.39.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.39.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.39.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.4.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.4.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.4.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.4.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.4.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.4.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.40.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.40.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.40.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.40.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.40.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.40.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.41.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.41.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.41.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.41.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.41.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.41.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.42.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.42.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.42.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.42.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.42.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.42.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.43.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.43.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.43.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.43.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.43.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.43.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.44.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.44.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.44.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.44.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.44.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.44.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.45.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.45.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.45.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.45.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.45.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.45.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.46.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.46.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.46.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.46.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.46.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.46.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.47.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.47.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.47.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.47.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.47.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.47.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.48.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.48.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.48.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.48.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.48.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.48.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.49.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.49.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.49.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.49.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.49.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.49.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.5.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.5.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.5.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.5.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.5.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.5.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.50.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.50.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.50.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.50.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.50.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.50.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.51.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.51.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.51.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.51.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.51.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.51.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.52.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.52.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.52.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.52.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.52.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.52.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.53.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.53.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.53.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.53.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.53.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.53.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.54.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.54.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.54.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.54.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.54.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.54.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.55.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.55.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.55.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.55.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.55.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.55.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.56.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.56.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.56.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.56.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.56.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.56.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.57.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.57.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.57.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.57.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.57.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.57.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.58.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.58.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.58.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.58.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.58.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.58.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.59.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.59.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.59.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.59.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.59.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.59.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.6.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.6.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.6.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.6.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.6.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.6.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.60.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.60.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.60.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.60.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.60.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.60.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.61.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.61.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.61.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.61.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.61.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.61.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.62.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.62.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.62.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.62.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.62.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.62.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.63.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.63.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.63.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.63.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.63.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.63.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.64.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.64.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.64.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.64.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.64.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.64.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.65.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.65.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.65.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.65.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.65.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.65.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.66.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.66.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.66.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.66.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.66.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.66.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.67.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.67.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.67.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.67.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.67.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.67.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.68.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.68.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.68.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.68.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.68.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.68.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.69.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.69.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.69.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.69.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.69.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.69.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.7.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.7.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.7.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.7.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.7.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.7.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.70.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.70.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.70.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.70.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.70.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.70.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.71.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.71.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.71.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.71.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.71.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.71.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.72.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.72.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.72.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.72.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.72.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.72.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.73.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.73.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.73.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.73.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.73.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.73.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.74.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.74.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.74.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.74.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.74.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.74.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.75.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.75.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.75.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.75.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.75.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.75.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.76.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.76.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.76.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.76.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.76.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.76.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.77.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.77.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.77.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.77.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.77.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.77.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.78.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.78.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.78.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.78.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.78.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.78.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.79.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.79.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.79.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.79.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.79.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.79.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.8.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.8.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.8.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.8.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.8.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.8.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.80.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.80.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.80.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.80.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.80.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.80.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.81.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.81.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.81.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.81.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.81.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.81.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.82.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.82.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.82.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.82.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.82.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.82.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.83.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.83.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.83.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.83.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.83.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.83.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.84.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.84.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.84.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.84.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.84.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.84.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.85.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.85.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.85.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.85.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.85.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.85.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.86.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.86.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.86.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.86.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.86.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.86.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.87.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.87.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.87.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.87.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.87.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.87.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.88.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.88.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.88.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.88.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.88.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.88.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.89.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.89.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.89.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.89.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.89.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.89.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.9.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.9.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.9.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.9.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.9.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.9.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.90.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.90.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.90.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.90.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.90.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.90.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.91.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.91.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.91.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.91.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.91.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.91.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.92.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.92.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.92.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.92.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.92.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.92.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.93.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.93.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.93.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.93.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.93.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.93.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.94.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.94.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.94.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.94.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.94.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.94.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.95.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.95.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.95.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.95.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.95.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.95.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.96.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.96.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.96.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.96.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.96.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.96.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.97.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.97.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.97.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.97.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.97.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.97.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.98.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.98.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.98.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.98.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.98.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.98.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.99.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.99.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.99.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.99.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.99.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.experts.99.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.gate.e_score_correction_bias": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.gate.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.shared_experts.down_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.shared_experts.down_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.shared_experts.gate_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.shared_experts.gate_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.shared_experts.up_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.mlp.shared_experts.up_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.post_attention_layernorm.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.self_attn.k_norm.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.self_attn.k_proj.bias": "model-00013-of-00092.safetensors",
+ "model.layers.12.self_attn.k_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.self_attn.k_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.self_attn.o_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.self_attn.o_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.self_attn.q_norm.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.self_attn.q_proj.bias": "model-00013-of-00092.safetensors",
+ "model.layers.12.self_attn.q_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.self_attn.q_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.12.self_attn.v_proj.bias": "model-00013-of-00092.safetensors",
+ "model.layers.12.self_attn.v_proj.weight": "model-00013-of-00092.safetensors",
+ "model.layers.12.self_attn.v_proj.weight_scale": "model-00013-of-00092.safetensors",
+ "model.layers.13.input_layernorm.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.0.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.0.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.0.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.0.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.0.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.0.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.1.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.1.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.1.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.1.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.1.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.1.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.10.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.10.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.10.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.10.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.10.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.10.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.100.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.100.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.100.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.100.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.100.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.100.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.101.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.101.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.101.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.101.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.101.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.101.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.102.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.102.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.102.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.102.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.102.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.102.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.103.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.103.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.103.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.103.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.103.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.103.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.104.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.104.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.104.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.104.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.104.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.104.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.105.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.105.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.105.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.105.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.105.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.105.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.106.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.106.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.106.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.106.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.106.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.106.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.107.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.107.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.107.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.107.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.107.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.107.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.108.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.108.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.108.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.108.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.108.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.108.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.109.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.109.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.109.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.109.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.109.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.109.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.11.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.11.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.11.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.11.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.11.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.11.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.110.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.110.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.110.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.110.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.110.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.110.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.111.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.111.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.111.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.111.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.111.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.111.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.112.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.112.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.112.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.112.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.112.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.112.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.113.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.113.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.113.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.113.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.113.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.113.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.114.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.114.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.114.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.114.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.114.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.114.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.115.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.115.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.115.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.115.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.115.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.115.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.116.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.116.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.116.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.116.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.116.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.116.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.117.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.117.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.117.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.117.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.117.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.117.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.118.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.118.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.118.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.118.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.118.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.118.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.119.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.119.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.119.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.119.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.119.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.119.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.12.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.12.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.12.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.12.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.12.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.12.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.120.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.120.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.120.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.120.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.120.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.120.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.121.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.121.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.121.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.121.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.121.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.121.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.122.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.122.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.122.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.122.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.122.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.122.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.123.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.123.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.123.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.123.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.123.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.123.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.124.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.124.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.124.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.124.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.124.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.124.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.125.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.125.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.125.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.125.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.125.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.125.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.126.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.126.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.126.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.126.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.126.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.126.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.127.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.127.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.127.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.127.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.127.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.127.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.128.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.128.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.128.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.128.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.128.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.128.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.129.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.129.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.129.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.129.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.129.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.129.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.13.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.13.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.13.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.13.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.13.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.13.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.130.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.130.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.130.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.130.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.130.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.130.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.131.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.131.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.131.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.131.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.131.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.131.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.132.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.132.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.132.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.132.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.132.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.132.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.133.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.133.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.133.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.133.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.133.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.133.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.134.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.134.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.134.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.134.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.134.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.134.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.135.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.135.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.135.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.135.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.135.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.135.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.136.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.136.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.136.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.136.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.136.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.136.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.137.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.137.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.137.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.137.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.137.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.137.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.138.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.138.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.138.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.138.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.138.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.138.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.139.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.139.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.139.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.139.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.139.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.139.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.14.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.14.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.14.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.14.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.14.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.14.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.140.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.140.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.140.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.140.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.140.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.140.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.141.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.141.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.141.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.141.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.141.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.141.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.142.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.142.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.142.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.142.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.142.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.142.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.143.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.143.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.143.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.143.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.143.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.143.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.144.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.144.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.144.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.144.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.144.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.144.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.145.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.145.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.145.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.145.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.145.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.145.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.146.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.146.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.146.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.146.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.146.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.146.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.147.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.147.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.147.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.147.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.147.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.147.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.148.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.148.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.148.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.148.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.148.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.148.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.149.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.149.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.149.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.149.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.149.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.149.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.15.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.15.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.15.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.15.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.15.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.15.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.150.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.150.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.150.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.150.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.150.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.150.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.151.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.151.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.151.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.151.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.151.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.151.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.152.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.152.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.152.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.152.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.152.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.152.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.153.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.153.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.153.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.153.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.153.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.153.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.154.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.154.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.154.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.154.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.154.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.154.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.155.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.155.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.155.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.155.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.155.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.155.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.156.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.156.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.156.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.156.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.156.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.156.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.157.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.157.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.157.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.157.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.157.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.157.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.158.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.158.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.158.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.158.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.158.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.158.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.159.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.159.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.159.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.159.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.159.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.159.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.16.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.16.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.16.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.16.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.16.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.16.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.17.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.17.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.17.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.17.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.17.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.17.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.18.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.18.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.18.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.18.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.18.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.18.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.19.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.19.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.19.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.19.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.19.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.19.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.2.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.2.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.2.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.2.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.2.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.2.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.20.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.20.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.20.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.20.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.20.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.20.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.21.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.21.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.21.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.21.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.21.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.21.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.22.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.22.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.22.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.22.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.22.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.22.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.23.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.23.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.23.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.23.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.23.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.23.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.24.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.24.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.24.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.24.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.24.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.24.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.25.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.25.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.25.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.25.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.25.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.25.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.26.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.26.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.26.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.26.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.26.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.26.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.27.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.27.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.27.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.27.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.27.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.27.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.28.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.28.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.28.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.28.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.28.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.28.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.29.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.29.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.29.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.29.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.29.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.29.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.3.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.3.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.3.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.3.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.3.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.3.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.30.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.30.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.30.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.30.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.30.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.30.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.31.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.31.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.31.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.31.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.31.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.31.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.32.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.32.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.32.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.32.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.32.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.32.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.33.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.33.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.33.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.33.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.33.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.33.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.34.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.34.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.34.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.34.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.34.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.34.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.35.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.35.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.35.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.35.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.35.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.35.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.36.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.36.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.36.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.36.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.36.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.36.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.37.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.37.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.37.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.37.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.37.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.37.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.38.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.38.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.38.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.38.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.38.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.38.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.39.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.39.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.39.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.39.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.39.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.39.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.4.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.4.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.4.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.4.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.4.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.4.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.40.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.40.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.40.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.40.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.40.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.40.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.41.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.41.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.41.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.41.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.41.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.41.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.42.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.42.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.42.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.42.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.42.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.42.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.43.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.43.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.43.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.43.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.43.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.43.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.44.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.44.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.44.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.44.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.44.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.44.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.45.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.45.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.45.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.45.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.45.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.45.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.46.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.46.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.46.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.46.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.46.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.46.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.47.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.47.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.47.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.47.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.47.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.47.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.48.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.48.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.48.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.48.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.48.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.48.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.49.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.49.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.49.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.49.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.49.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.49.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.5.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.5.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.5.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.5.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.5.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.5.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.50.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.50.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.50.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.50.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.50.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.50.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.51.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.51.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.51.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.51.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.51.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.51.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.52.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.52.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.52.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.52.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.52.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.52.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.53.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.53.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.53.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.53.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.53.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.53.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.54.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.54.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.54.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.54.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.54.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.54.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.55.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.55.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.55.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.55.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.55.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.55.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.56.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.56.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.56.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.56.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.56.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.56.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.57.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.57.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.57.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.57.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.57.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.57.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.58.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.58.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.58.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.58.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.58.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.58.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.59.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.59.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.59.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.59.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.59.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.59.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.6.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.6.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.6.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.6.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.6.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.6.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.60.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.60.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.60.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.60.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.60.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.60.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.61.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.61.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.61.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.61.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.61.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.61.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.62.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.62.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.62.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.62.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.62.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.62.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.63.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.63.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.63.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.63.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.63.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.63.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.64.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.64.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.64.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.64.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.64.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.64.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.65.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.65.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.65.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.65.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.65.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.65.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.66.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.66.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.66.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.66.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.66.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.66.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.67.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.67.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.67.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.67.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.67.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.67.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.68.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.68.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.68.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.68.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.68.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.68.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.69.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.69.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.69.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.69.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.69.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.69.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.7.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.7.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.7.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.7.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.7.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.7.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.70.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.70.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.70.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.70.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.70.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.70.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.71.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.71.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.71.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.71.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.71.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.71.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.72.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.72.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.72.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.72.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.72.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.72.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.73.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.73.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.73.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.73.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.73.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.73.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.74.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.74.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.74.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.74.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.74.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.74.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.75.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.75.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.75.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.75.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.75.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.75.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.76.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.76.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.76.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.76.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.76.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.76.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.77.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.77.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.77.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.77.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.77.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.77.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.78.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.78.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.78.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.78.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.78.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.78.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.79.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.79.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.79.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.79.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.79.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.79.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.8.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.8.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.8.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.8.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.8.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.8.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.80.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.80.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.80.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.80.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.80.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.80.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.81.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.81.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.81.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.81.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.81.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.81.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.82.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.82.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.82.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.82.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.82.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.82.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.83.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.83.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.83.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.83.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.83.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.83.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.84.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.84.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.84.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.84.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.84.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.84.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.85.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.85.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.85.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.85.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.85.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.85.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.86.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.86.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.86.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.86.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.86.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.86.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.87.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.87.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.87.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.87.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.87.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.87.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.88.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.88.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.88.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.88.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.88.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.88.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.89.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.89.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.89.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.89.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.89.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.89.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.9.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.9.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.9.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.9.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.9.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.9.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.90.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.90.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.90.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.90.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.90.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.90.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.91.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.91.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.91.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.91.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.91.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.91.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.92.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.92.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.92.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.92.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.92.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.92.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.93.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.93.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.93.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.93.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.93.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.93.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.94.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.94.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.94.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.94.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.94.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.94.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.95.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.95.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.95.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.95.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.95.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.95.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.96.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.96.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.96.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.96.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.96.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.96.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.97.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.97.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.97.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.97.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.97.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.97.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.98.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.98.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.98.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.98.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.98.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.98.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.99.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.99.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.99.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.99.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.99.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.experts.99.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.gate.e_score_correction_bias": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.gate.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.shared_experts.down_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.shared_experts.down_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.shared_experts.gate_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.shared_experts.gate_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.shared_experts.up_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.mlp.shared_experts.up_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.post_attention_layernorm.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.self_attn.k_norm.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.self_attn.k_proj.bias": "model-00014-of-00092.safetensors",
+ "model.layers.13.self_attn.k_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.self_attn.k_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.self_attn.o_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.self_attn.o_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.self_attn.q_norm.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.self_attn.q_proj.bias": "model-00014-of-00092.safetensors",
+ "model.layers.13.self_attn.q_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.self_attn.q_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.13.self_attn.v_proj.bias": "model-00014-of-00092.safetensors",
+ "model.layers.13.self_attn.v_proj.weight": "model-00014-of-00092.safetensors",
+ "model.layers.13.self_attn.v_proj.weight_scale": "model-00014-of-00092.safetensors",
+ "model.layers.14.input_layernorm.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.0.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.0.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.0.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.0.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.0.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.0.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.1.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.1.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.1.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.1.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.1.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.1.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.10.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.10.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.10.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.10.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.10.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.10.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.100.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.100.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.100.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.100.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.100.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.100.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.101.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.101.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.101.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.101.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.101.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.101.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.102.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.102.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.102.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.102.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.102.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.102.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.103.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.103.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.103.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.103.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.103.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.103.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.104.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.104.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.104.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.104.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.104.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.104.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.105.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.105.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.105.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.105.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.105.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.105.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.106.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.106.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.106.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.106.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.106.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.106.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.107.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.107.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.107.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.107.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.107.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.107.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.108.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.108.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.108.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.108.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.108.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.108.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.109.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.109.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.109.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.109.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.109.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.109.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.11.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.11.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.11.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.11.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.11.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.11.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.110.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.110.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.110.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.110.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.110.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.110.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.111.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.111.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.111.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.111.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.111.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.111.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.112.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.112.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.112.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.112.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.112.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.112.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.113.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.113.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.113.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.113.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.113.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.113.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.114.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.114.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.114.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.114.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.114.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.114.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.115.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.115.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.115.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.115.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.115.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.115.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.116.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.116.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.116.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.116.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.116.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.116.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.117.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.117.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.117.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.117.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.117.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.117.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.118.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.118.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.118.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.118.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.118.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.118.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.119.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.119.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.119.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.119.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.119.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.119.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.12.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.12.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.12.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.12.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.12.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.12.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.120.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.120.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.120.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.120.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.120.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.120.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.121.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.121.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.121.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.121.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.121.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.121.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.122.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.122.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.122.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.122.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.122.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.122.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.123.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.123.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.123.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.123.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.123.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.123.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.124.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.124.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.124.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.124.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.124.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.124.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.125.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.125.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.125.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.125.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.125.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.125.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.126.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.126.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.126.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.126.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.126.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.126.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.127.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.127.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.127.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.127.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.127.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.127.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.128.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.128.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.128.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.128.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.128.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.128.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.129.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.129.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.129.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.129.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.129.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.129.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.13.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.13.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.13.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.13.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.13.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.13.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.130.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.130.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.130.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.130.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.130.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.130.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.131.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.131.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.131.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.131.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.131.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.131.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.132.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.132.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.132.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.132.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.132.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.132.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.133.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.133.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.133.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.133.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.133.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.133.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.134.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.134.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.134.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.134.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.134.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.134.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.135.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.135.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.135.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.135.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.135.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.135.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.136.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.136.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.136.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.136.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.136.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.136.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.137.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.137.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.137.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.137.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.137.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.137.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.138.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.138.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.138.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.138.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.138.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.138.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.139.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.139.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.139.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.139.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.139.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.139.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.14.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.14.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.14.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.14.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.14.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.14.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.140.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.140.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.140.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.140.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.140.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.140.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.141.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.141.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.141.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.141.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.141.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.141.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.142.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.142.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.142.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.142.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.142.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.142.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.143.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.143.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.143.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.143.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.143.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.143.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.144.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.144.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.144.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.144.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.144.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.144.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.145.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.145.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.145.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.145.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.145.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.145.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.146.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.146.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.146.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.146.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.146.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.146.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.147.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.147.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.147.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.147.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.147.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.147.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.148.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.148.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.148.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.148.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.148.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.148.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.149.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.149.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.149.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.149.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.149.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.149.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.15.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.15.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.15.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.15.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.15.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.15.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.150.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.150.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.150.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.150.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.150.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.150.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.151.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.151.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.151.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.151.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.151.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.151.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.152.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.152.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.152.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.152.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.152.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.152.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.153.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.153.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.153.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.153.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.153.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.153.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.154.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.154.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.154.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.154.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.154.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.154.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.155.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.155.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.155.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.155.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.155.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.155.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.156.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.156.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.156.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.156.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.156.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.156.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.157.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.157.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.157.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.157.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.157.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.157.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.158.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.158.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.158.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.158.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.158.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.158.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.159.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.159.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.159.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.159.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.159.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.159.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.16.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.16.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.16.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.16.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.16.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.16.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.17.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.17.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.17.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.17.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.17.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.17.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.18.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.18.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.18.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.18.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.18.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.18.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.19.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.19.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.19.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.19.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.19.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.19.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.2.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.2.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.2.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.2.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.2.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.2.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.20.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.20.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.20.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.20.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.20.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.20.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.21.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.21.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.21.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.21.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.21.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.21.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.22.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.22.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.22.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.22.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.22.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.22.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.23.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.23.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.23.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.23.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.23.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.23.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.24.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.24.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.24.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.24.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.24.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.24.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.25.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.25.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.25.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.25.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.25.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.25.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.26.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.26.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.26.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.26.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.26.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.26.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.27.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.27.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.27.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.27.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.27.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.27.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.28.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.28.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.28.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.28.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.28.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.28.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.29.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.29.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.29.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.29.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.29.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.29.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.3.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.3.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.3.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.3.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.3.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.3.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.30.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.30.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.30.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.30.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.30.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.30.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.31.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.31.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.31.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.31.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.31.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.31.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.32.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.32.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.32.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.32.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.32.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.32.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.33.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.33.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.33.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.33.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.33.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.33.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.34.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.34.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.34.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.34.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.34.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.34.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.35.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.35.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.35.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.35.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.35.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.35.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.36.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.36.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.36.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.36.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.36.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.36.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.37.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.37.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.37.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.37.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.37.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.37.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.38.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.38.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.38.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.38.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.38.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.38.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.39.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.39.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.39.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.39.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.39.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.39.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.4.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.4.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.4.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.4.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.4.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.4.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.40.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.40.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.40.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.40.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.40.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.40.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.41.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.41.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.41.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.41.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.41.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.41.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.42.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.42.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.42.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.42.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.42.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.42.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.43.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.43.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.43.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.43.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.43.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.43.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.44.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.44.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.44.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.44.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.44.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.44.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.45.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.45.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.45.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.45.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.45.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.45.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.46.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.46.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.46.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.46.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.46.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.46.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.47.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.47.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.47.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.47.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.47.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.47.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.48.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.48.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.48.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.48.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.48.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.48.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.49.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.49.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.49.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.49.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.49.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.49.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.5.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.5.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.5.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.5.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.5.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.5.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.50.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.50.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.50.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.50.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.50.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.50.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.51.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.51.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.51.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.51.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.51.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.51.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.52.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.52.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.52.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.52.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.52.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.52.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.53.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.53.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.53.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.53.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.53.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.53.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.54.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.54.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.54.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.54.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.54.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.54.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.55.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.55.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.55.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.55.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.55.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.55.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.56.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.56.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.56.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.56.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.56.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.56.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.57.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.57.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.57.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.57.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.57.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.57.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.58.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.58.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.58.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.58.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.58.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.58.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.59.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.59.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.59.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.59.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.59.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.59.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.6.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.6.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.6.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.6.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.6.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.6.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.60.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.60.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.60.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.60.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.60.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.60.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.61.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.61.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.61.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.61.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.61.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.61.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.62.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.62.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.62.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.62.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.62.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.62.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.63.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.63.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.63.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.63.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.63.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.63.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.64.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.64.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.64.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.64.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.64.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.64.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.65.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.65.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.65.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.65.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.65.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.65.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.66.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.66.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.66.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.66.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.66.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.66.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.67.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.67.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.67.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.67.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.67.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.67.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.68.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.68.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.68.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.68.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.68.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.68.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.69.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.69.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.69.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.69.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.69.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.69.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.7.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.7.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.7.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.7.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.7.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.7.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.70.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.70.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.70.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.70.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.70.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.70.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.71.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.71.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.71.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.71.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.71.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.71.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.72.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.72.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.72.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.72.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.72.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.72.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.73.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.73.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.73.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.73.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.73.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.73.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.74.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.74.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.74.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.74.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.74.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.74.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.75.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.75.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.75.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.75.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.75.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.75.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.76.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.76.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.76.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.76.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.76.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.76.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.77.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.77.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.77.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.77.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.77.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.77.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.78.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.78.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.78.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.78.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.78.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.78.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.79.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.79.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.79.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.79.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.79.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.79.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.8.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.8.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.8.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.8.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.8.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.8.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.80.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.80.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.80.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.80.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.80.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.80.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.81.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.81.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.81.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.81.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.81.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.81.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.82.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.82.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.82.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.82.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.82.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.82.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.83.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.83.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.83.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.83.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.83.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.83.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.84.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.84.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.84.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.84.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.84.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.84.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.85.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.85.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.85.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.85.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.85.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.85.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.86.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.86.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.86.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.86.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.86.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.86.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.87.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.87.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.87.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.87.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.87.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.87.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.88.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.88.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.88.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.88.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.88.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.88.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.89.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.89.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.89.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.89.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.89.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.89.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.9.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.9.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.9.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.9.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.9.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.9.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.90.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.90.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.90.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.90.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.90.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.90.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.91.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.91.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.91.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.91.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.91.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.91.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.92.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.92.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.92.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.92.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.92.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.92.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.93.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.93.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.93.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.93.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.93.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.93.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.94.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.94.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.94.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.94.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.94.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.94.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.95.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.95.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.95.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.95.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.95.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.95.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.96.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.96.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.96.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.96.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.96.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.96.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.97.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.97.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.97.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.97.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.97.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.97.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.98.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.98.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.98.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.98.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.98.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.98.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.99.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.99.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.99.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.99.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.99.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.experts.99.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.gate.e_score_correction_bias": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.gate.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.shared_experts.down_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.shared_experts.down_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.shared_experts.gate_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.shared_experts.gate_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.shared_experts.up_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.mlp.shared_experts.up_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.post_attention_layernorm.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.self_attn.k_norm.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.self_attn.k_proj.bias": "model-00015-of-00092.safetensors",
+ "model.layers.14.self_attn.k_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.self_attn.k_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.self_attn.o_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.self_attn.o_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.self_attn.q_norm.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.self_attn.q_proj.bias": "model-00015-of-00092.safetensors",
+ "model.layers.14.self_attn.q_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.self_attn.q_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.14.self_attn.v_proj.bias": "model-00015-of-00092.safetensors",
+ "model.layers.14.self_attn.v_proj.weight": "model-00015-of-00092.safetensors",
+ "model.layers.14.self_attn.v_proj.weight_scale": "model-00015-of-00092.safetensors",
+ "model.layers.15.input_layernorm.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.0.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.0.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.0.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.0.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.0.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.0.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.1.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.1.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.1.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.1.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.1.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.1.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.10.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.10.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.10.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.10.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.10.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.10.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.100.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.100.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.100.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.100.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.100.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.100.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.101.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.101.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.101.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.101.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.101.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.101.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.102.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.102.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.102.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.102.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.102.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.102.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.103.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.103.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.103.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.103.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.103.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.103.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.104.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.104.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.104.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.104.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.104.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.104.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.105.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.105.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.105.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.105.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.105.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.105.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.106.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.106.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.106.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.106.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.106.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.106.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.107.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.107.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.107.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.107.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.107.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.107.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.108.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.108.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.108.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.108.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.108.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.108.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.109.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.109.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.109.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.109.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.109.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.109.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.11.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.11.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.11.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.11.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.11.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.11.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.110.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.110.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.110.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.110.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.110.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.110.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.111.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.111.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.111.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.111.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.111.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.111.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.112.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.112.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.112.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.112.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.112.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.112.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.113.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.113.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.113.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.113.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.113.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.113.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.114.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.114.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.114.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.114.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.114.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.114.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.115.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.115.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.115.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.115.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.115.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.115.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.116.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.116.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.116.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.116.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.116.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.116.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.117.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.117.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.117.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.117.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.117.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.117.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.118.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.118.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.118.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.118.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.118.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.118.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.119.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.119.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.119.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.119.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.119.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.119.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.12.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.12.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.12.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.12.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.12.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.12.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.120.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.120.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.120.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.120.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.120.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.120.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.121.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.121.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.121.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.121.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.121.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.121.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.122.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.122.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.122.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.122.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.122.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.122.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.123.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.123.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.123.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.123.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.123.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.123.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.124.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.124.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.124.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.124.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.124.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.124.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.125.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.125.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.125.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.125.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.125.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.125.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.126.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.126.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.126.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.126.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.126.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.126.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.127.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.127.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.127.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.127.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.127.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.127.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.128.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.128.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.128.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.128.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.128.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.128.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.129.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.129.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.129.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.129.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.129.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.129.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.13.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.13.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.13.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.13.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.13.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.13.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.130.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.130.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.130.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.130.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.130.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.130.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.131.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.131.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.131.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.131.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.131.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.131.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.132.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.132.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.132.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.132.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.132.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.132.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.133.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.133.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.133.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.133.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.133.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.133.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.134.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.134.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.134.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.134.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.134.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.134.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.135.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.135.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.135.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.135.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.135.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.135.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.136.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.136.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.136.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.136.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.136.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.136.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.137.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.137.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.137.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.137.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.137.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.137.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.138.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.138.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.138.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.138.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.138.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.138.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.139.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.139.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.139.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.139.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.139.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.139.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.14.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.14.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.14.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.14.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.14.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.14.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.140.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.140.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.140.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.140.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.140.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.140.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.141.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.141.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.141.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.141.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.141.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.141.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.142.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.142.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.142.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.142.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.142.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.142.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.143.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.143.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.143.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.143.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.143.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.143.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.144.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.144.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.144.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.144.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.144.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.144.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.145.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.145.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.145.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.145.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.145.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.145.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.146.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.146.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.146.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.146.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.146.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.146.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.147.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.147.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.147.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.147.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.147.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.147.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.148.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.148.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.148.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.148.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.148.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.148.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.149.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.149.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.149.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.149.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.149.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.149.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.15.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.15.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.15.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.15.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.15.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.15.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.150.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.150.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.150.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.150.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.150.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.150.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.151.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.151.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.151.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.151.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.151.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.151.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.152.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.152.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.152.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.152.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.152.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.152.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.153.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.153.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.153.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.153.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.153.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.153.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.154.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.154.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.154.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.154.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.154.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.154.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.155.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.155.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.155.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.155.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.155.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.155.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.156.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.156.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.156.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.156.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.156.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.156.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.157.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.157.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.157.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.157.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.157.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.157.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.158.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.158.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.158.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.158.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.158.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.158.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.159.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.159.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.159.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.159.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.159.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.159.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.16.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.16.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.16.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.16.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.16.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.16.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.17.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.17.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.17.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.17.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.17.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.17.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.18.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.18.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.18.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.18.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.18.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.18.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.19.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.19.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.19.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.19.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.19.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.19.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.2.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.2.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.2.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.2.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.2.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.2.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.20.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.20.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.20.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.20.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.20.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.20.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.21.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.21.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.21.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.21.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.21.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.21.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.22.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.22.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.22.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.22.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.22.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.22.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.23.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.23.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.23.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.23.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.23.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.23.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.24.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.24.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.24.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.24.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.24.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.24.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.25.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.25.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.25.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.25.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.25.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.25.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.26.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.26.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.26.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.26.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.26.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.26.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.27.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.27.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.27.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.27.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.27.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.27.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.28.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.28.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.28.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.28.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.28.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.28.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.29.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.29.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.29.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.29.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.29.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.29.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.3.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.3.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.3.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.3.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.3.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.3.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.30.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.30.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.30.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.30.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.30.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.30.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.31.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.31.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.31.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.31.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.31.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.31.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.32.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.32.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.32.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.32.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.32.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.32.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.33.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.33.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.33.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.33.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.33.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.33.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.34.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.34.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.34.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.34.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.34.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.34.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.35.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.35.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.35.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.35.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.35.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.35.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.36.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.36.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.36.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.36.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.36.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.36.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.37.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.37.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.37.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.37.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.37.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.37.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.38.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.38.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.38.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.38.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.38.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.38.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.39.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.39.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.39.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.39.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.39.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.39.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.4.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.4.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.4.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.4.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.4.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.4.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.40.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.40.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.40.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.40.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.40.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.40.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.41.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.41.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.41.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.41.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.41.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.41.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.42.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.42.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.42.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.42.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.42.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.42.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.43.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.43.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.43.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.43.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.43.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.43.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.44.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.44.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.44.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.44.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.44.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.44.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.45.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.45.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.45.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.45.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.45.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.45.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.46.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.46.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.46.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.46.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.46.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.46.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.47.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.47.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.47.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.47.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.47.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.47.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.48.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.48.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.48.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.48.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.48.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.48.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.49.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.49.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.49.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.49.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.49.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.49.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.5.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.5.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.5.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.5.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.5.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.5.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.50.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.50.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.50.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.50.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.50.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.50.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.51.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.51.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.51.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.51.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.51.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.51.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.52.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.52.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.52.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.52.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.52.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.52.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.53.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.53.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.53.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.53.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.53.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.53.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.54.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.54.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.54.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.54.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.54.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.54.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.55.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.55.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.55.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.55.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.55.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.55.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.56.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.56.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.56.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.56.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.56.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.56.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.57.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.57.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.57.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.57.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.57.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.57.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.58.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.58.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.58.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.58.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.58.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.58.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.59.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.59.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.59.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.59.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.59.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.59.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.6.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.6.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.6.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.6.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.6.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.6.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.60.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.60.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.60.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.60.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.60.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.60.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.61.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.61.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.61.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.61.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.61.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.61.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.62.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.62.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.62.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.62.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.62.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.62.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.63.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.63.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.63.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.63.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.63.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.63.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.64.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.64.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.64.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.64.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.64.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.64.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.65.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.65.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.65.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.65.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.65.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.65.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.66.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.66.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.66.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.66.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.66.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.66.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.67.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.67.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.67.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.67.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.67.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.67.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.68.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.68.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.68.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.68.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.68.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.68.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.69.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.69.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.69.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.69.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.69.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.69.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.7.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.7.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.7.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.7.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.7.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.7.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.70.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.70.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.70.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.70.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.70.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.70.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.71.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.71.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.71.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.71.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.71.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.71.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.72.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.72.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.72.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.72.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.72.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.72.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.73.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.73.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.73.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.73.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.73.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.73.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.74.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.74.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.74.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.74.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.74.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.74.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.75.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.75.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.75.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.75.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.75.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.75.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.76.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.76.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.76.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.76.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.76.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.76.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.77.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.77.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.77.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.77.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.77.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.77.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.78.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.78.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.78.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.78.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.78.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.78.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.79.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.79.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.79.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.79.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.79.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.79.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.8.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.8.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.8.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.8.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.8.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.8.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.80.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.80.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.80.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.80.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.80.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.80.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.81.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.81.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.81.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.81.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.81.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.81.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.82.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.82.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.82.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.82.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.82.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.82.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.83.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.83.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.83.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.83.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.83.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.83.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.84.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.84.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.84.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.84.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.84.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.84.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.85.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.85.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.85.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.85.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.85.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.85.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.86.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.86.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.86.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.86.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.86.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.86.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.87.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.87.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.87.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.87.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.87.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.87.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.88.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.88.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.88.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.88.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.88.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.88.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.89.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.89.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.89.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.89.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.89.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.89.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.9.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.9.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.9.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.9.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.9.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.9.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.90.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.90.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.90.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.90.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.90.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.90.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.91.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.91.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.91.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.91.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.91.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.91.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.92.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.92.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.92.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.92.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.92.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.92.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.93.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.93.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.93.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.93.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.93.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.93.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.94.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.94.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.94.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.94.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.94.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.94.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.95.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.95.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.95.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.95.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.95.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.95.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.96.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.96.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.96.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.96.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.96.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.96.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.97.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.97.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.97.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.97.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.97.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.97.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.98.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.98.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.98.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.98.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.98.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.98.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.99.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.99.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.99.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.99.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.99.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.experts.99.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.gate.e_score_correction_bias": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.gate.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.shared_experts.down_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.shared_experts.down_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.shared_experts.gate_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.shared_experts.gate_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.shared_experts.up_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.mlp.shared_experts.up_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.post_attention_layernorm.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.self_attn.k_norm.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.self_attn.k_proj.bias": "model-00016-of-00092.safetensors",
+ "model.layers.15.self_attn.k_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.self_attn.k_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.self_attn.o_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.self_attn.o_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.self_attn.q_norm.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.self_attn.q_proj.bias": "model-00016-of-00092.safetensors",
+ "model.layers.15.self_attn.q_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.self_attn.q_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.15.self_attn.v_proj.bias": "model-00016-of-00092.safetensors",
+ "model.layers.15.self_attn.v_proj.weight": "model-00016-of-00092.safetensors",
+ "model.layers.15.self_attn.v_proj.weight_scale": "model-00016-of-00092.safetensors",
+ "model.layers.16.input_layernorm.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.0.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.0.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.0.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.0.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.0.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.0.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.1.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.1.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.1.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.1.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.1.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.1.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.10.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.10.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.10.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.10.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.10.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.10.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.100.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.100.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.100.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.100.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.100.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.100.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.101.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.101.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.101.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.101.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.101.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.101.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.102.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.102.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.102.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.102.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.102.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.102.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.103.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.103.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.103.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.103.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.103.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.103.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.104.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.104.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.104.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.104.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.104.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.104.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.105.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.105.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.105.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.105.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.105.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.105.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.106.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.106.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.106.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.106.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.106.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.106.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.107.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.107.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.107.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.107.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.107.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.107.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.108.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.108.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.108.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.108.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.108.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.108.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.109.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.109.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.109.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.109.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.109.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.109.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.11.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.11.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.11.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.11.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.11.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.11.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.110.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.110.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.110.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.110.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.110.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.110.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.111.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.111.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.111.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.111.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.111.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.111.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.112.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.112.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.112.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.112.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.112.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.112.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.113.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.113.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.113.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.113.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.113.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.113.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.114.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.114.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.114.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.114.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.114.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.114.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.115.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.115.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.115.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.115.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.115.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.115.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.116.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.116.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.116.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.116.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.116.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.116.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.117.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.117.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.117.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.117.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.117.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.117.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.118.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.118.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.118.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.118.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.118.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.118.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.119.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.119.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.119.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.119.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.119.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.119.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.12.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.12.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.12.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.12.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.12.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.12.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.120.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.120.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.120.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.120.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.120.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.120.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.121.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.121.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.121.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.121.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.121.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.121.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.122.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.122.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.122.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.122.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.122.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.122.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.123.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.123.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.123.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.123.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.123.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.123.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.124.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.124.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.124.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.124.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.124.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.124.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.125.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.125.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.125.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.125.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.125.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.125.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.126.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.126.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.126.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.126.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.126.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.126.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.127.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.127.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.127.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.127.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.127.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.127.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.128.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.128.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.128.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.128.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.128.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.128.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.129.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.129.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.129.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.129.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.129.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.129.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.13.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.13.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.13.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.13.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.13.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.13.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.130.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.130.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.130.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.130.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.130.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.130.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.131.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.131.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.131.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.131.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.131.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.131.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.132.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.132.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.132.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.132.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.132.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.132.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.133.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.133.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.133.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.133.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.133.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.133.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.134.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.134.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.134.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.134.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.134.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.134.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.135.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.135.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.135.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.135.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.135.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.135.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.136.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.136.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.136.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.136.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.136.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.136.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.137.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.137.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.137.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.137.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.137.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.137.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.138.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.138.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.138.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.138.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.138.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.138.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.139.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.139.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.139.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.139.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.139.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.139.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.14.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.14.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.14.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.14.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.14.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.14.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.140.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.140.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.140.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.140.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.140.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.140.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.141.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.141.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.141.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.141.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.141.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.141.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.142.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.142.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.142.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.142.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.142.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.142.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.143.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.143.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.143.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.143.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.143.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.143.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.144.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.144.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.144.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.144.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.144.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.144.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.145.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.145.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.145.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.145.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.145.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.145.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.146.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.146.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.146.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.146.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.146.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.146.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.147.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.147.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.147.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.147.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.147.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.147.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.148.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.148.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.148.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.148.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.148.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.148.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.149.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.149.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.149.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.149.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.149.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.149.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.15.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.15.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.15.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.15.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.15.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.15.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.150.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.150.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.150.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.150.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.150.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.150.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.151.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.151.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.151.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.151.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.151.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.151.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.152.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.152.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.152.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.152.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.152.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.152.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.153.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.153.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.153.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.153.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.153.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.153.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.154.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.154.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.154.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.154.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.154.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.154.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.155.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.155.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.155.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.155.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.155.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.155.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.156.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.156.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.156.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.156.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.156.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.156.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.157.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.157.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.157.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.157.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.157.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.157.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.158.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.158.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.158.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.158.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.158.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.158.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.159.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.159.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.159.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.159.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.159.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.159.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.16.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.16.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.16.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.16.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.16.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.16.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.17.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.17.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.17.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.17.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.17.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.17.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.18.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.18.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.18.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.18.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.18.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.18.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.19.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.19.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.19.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.19.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.19.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.19.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.2.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.2.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.2.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.2.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.2.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.2.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.20.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.20.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.20.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.20.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.20.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.20.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.21.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.21.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.21.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.21.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.21.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.21.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.22.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.22.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.22.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.22.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.22.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.22.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.23.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.23.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.23.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.23.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.23.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.23.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.24.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.24.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.24.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.24.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.24.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.24.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.25.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.25.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.25.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.25.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.25.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.25.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.26.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.26.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.26.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.26.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.26.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.26.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.27.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.27.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.27.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.27.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.27.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.27.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.28.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.28.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.28.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.28.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.28.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.28.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.29.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.29.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.29.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.29.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.29.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.29.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.3.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.3.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.3.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.3.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.3.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.3.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.30.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.30.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.30.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.30.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.30.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.30.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.31.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.31.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.31.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.31.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.31.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.31.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.32.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.32.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.32.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.32.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.32.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.32.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.33.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.33.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.33.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.33.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.33.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.33.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.34.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.34.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.34.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.34.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.34.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.34.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.35.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.35.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.35.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.35.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.35.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.35.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.36.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.36.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.36.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.36.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.36.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.36.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.37.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.37.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.37.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.37.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.37.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.37.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.38.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.38.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.38.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.38.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.38.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.38.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.39.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.39.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.39.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.39.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.39.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.39.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.4.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.4.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.4.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.4.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.4.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.4.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.40.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.40.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.40.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.40.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.40.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.40.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.41.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.41.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.41.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.41.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.41.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.41.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.42.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.42.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.42.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.42.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.42.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.42.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.43.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.43.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.43.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.43.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.43.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.43.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.44.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.44.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.44.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.44.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.44.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.44.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.45.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.45.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.45.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.45.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.45.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.45.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.46.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.46.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.46.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.46.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.46.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.46.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.47.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.47.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.47.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.47.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.47.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.47.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.48.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.48.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.48.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.48.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.48.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.48.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.49.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.49.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.49.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.49.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.49.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.49.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.5.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.5.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.5.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.5.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.5.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.5.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.50.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.50.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.50.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.50.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.50.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.50.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.51.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.51.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.51.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.51.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.51.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.51.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.52.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.52.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.52.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.52.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.52.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.52.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.53.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.53.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.53.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.53.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.53.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.53.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.54.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.54.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.54.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.54.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.54.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.54.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.55.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.55.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.55.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.55.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.55.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.55.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.56.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.56.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.56.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.56.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.56.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.56.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.57.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.57.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.57.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.57.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.57.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.57.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.58.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.58.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.58.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.58.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.58.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.58.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.59.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.59.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.59.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.59.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.59.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.59.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.6.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.6.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.6.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.6.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.6.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.6.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.60.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.60.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.60.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.60.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.60.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.60.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.61.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.61.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.61.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.61.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.61.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.61.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.62.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.62.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.62.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.62.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.62.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.62.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.63.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.63.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.63.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.63.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.63.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.63.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.64.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.64.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.64.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.64.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.64.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.64.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.65.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.65.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.65.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.65.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.65.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.65.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.66.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.66.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.66.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.66.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.66.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.66.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.67.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.67.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.67.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.67.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.67.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.67.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.68.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.68.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.68.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.68.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.68.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.68.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.69.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.69.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.69.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.69.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.69.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.69.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.7.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.7.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.7.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.7.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.7.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.7.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.70.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.70.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.70.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.70.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.70.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.70.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.71.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.71.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.71.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.71.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.71.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.71.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.72.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.72.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.72.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.72.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.72.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.72.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.73.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.73.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.73.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.73.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.73.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.73.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.74.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.74.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.74.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.74.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.74.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.74.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.75.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.75.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.75.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.75.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.75.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.75.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.76.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.76.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.76.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.76.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.76.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.76.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.77.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.77.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.77.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.77.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.77.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.77.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.78.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.78.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.78.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.78.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.78.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.78.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.79.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.79.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.79.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.79.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.79.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.79.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.8.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.8.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.8.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.8.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.8.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.8.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.80.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.80.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.80.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.80.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.80.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.80.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.81.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.81.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.81.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.81.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.81.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.81.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.82.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.82.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.82.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.82.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.82.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.82.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.83.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.83.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.83.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.83.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.83.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.83.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.84.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.84.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.84.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.84.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.84.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.84.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.85.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.85.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.85.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.85.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.85.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.85.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.86.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.86.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.86.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.86.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.86.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.86.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.87.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.87.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.87.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.87.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.87.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.87.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.88.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.88.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.88.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.88.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.88.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.88.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.89.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.89.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.89.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.89.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.89.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.89.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.9.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.9.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.9.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.9.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.9.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.9.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.90.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.90.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.90.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.90.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.90.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.90.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.91.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.91.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.91.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.91.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.91.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.91.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.92.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.92.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.92.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.92.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.92.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.92.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.93.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.93.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.93.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.93.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.93.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.93.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.94.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.94.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.94.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.94.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.94.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.94.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.95.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.95.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.95.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.95.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.95.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.95.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.96.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.96.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.96.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.96.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.96.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.96.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.97.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.97.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.97.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.97.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.97.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.97.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.98.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.98.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.98.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.98.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.98.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.98.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.99.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.99.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.99.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.99.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.99.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.experts.99.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.gate.e_score_correction_bias": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.gate.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.shared_experts.down_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.shared_experts.down_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.shared_experts.gate_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.shared_experts.gate_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.shared_experts.up_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.mlp.shared_experts.up_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.post_attention_layernorm.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.self_attn.k_norm.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.self_attn.k_proj.bias": "model-00017-of-00092.safetensors",
+ "model.layers.16.self_attn.k_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.self_attn.k_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.self_attn.o_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.self_attn.o_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.self_attn.q_norm.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.self_attn.q_proj.bias": "model-00017-of-00092.safetensors",
+ "model.layers.16.self_attn.q_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.self_attn.q_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.16.self_attn.v_proj.bias": "model-00017-of-00092.safetensors",
+ "model.layers.16.self_attn.v_proj.weight": "model-00017-of-00092.safetensors",
+ "model.layers.16.self_attn.v_proj.weight_scale": "model-00017-of-00092.safetensors",
+ "model.layers.17.input_layernorm.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.0.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.0.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.0.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.0.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.0.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.0.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.1.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.1.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.1.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.1.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.1.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.1.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.10.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.10.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.10.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.10.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.10.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.10.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.100.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.100.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.100.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.100.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.100.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.100.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.101.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.101.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.101.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.101.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.101.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.101.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.102.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.102.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.102.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.102.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.102.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.102.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.103.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.103.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.103.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.103.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.103.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.103.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.104.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.104.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.104.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.104.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.104.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.104.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.105.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.105.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.105.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.105.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.105.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.105.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.106.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.106.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.106.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.106.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.106.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.106.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.107.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.107.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.107.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.107.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.107.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.107.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.108.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.108.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.108.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.108.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.108.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.108.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.109.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.109.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.109.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.109.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.109.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.109.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.11.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.11.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.11.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.11.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.11.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.11.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.110.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.110.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.110.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.110.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.110.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.110.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.111.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.111.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.111.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.111.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.111.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.111.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.112.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.112.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.112.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.112.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.112.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.112.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.113.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.113.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.113.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.113.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.113.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.113.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.114.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.114.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.114.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.114.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.114.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.114.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.115.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.115.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.115.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.115.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.115.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.115.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.116.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.116.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.116.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.116.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.116.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.116.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.117.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.117.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.117.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.117.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.117.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.117.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.118.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.118.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.118.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.118.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.118.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.118.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.119.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.119.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.119.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.119.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.119.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.119.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.12.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.12.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.12.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.12.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.12.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.12.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.120.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.120.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.120.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.120.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.120.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.120.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.121.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.121.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.121.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.121.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.121.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.121.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.122.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.122.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.122.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.122.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.122.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.122.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.123.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.123.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.123.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.123.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.123.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.123.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.124.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.124.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.124.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.124.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.124.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.124.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.125.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.125.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.125.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.125.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.125.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.125.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.126.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.126.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.126.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.126.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.126.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.126.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.127.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.127.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.127.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.127.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.127.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.127.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.128.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.128.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.128.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.128.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.128.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.128.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.129.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.129.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.129.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.129.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.129.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.129.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.13.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.13.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.13.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.13.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.13.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.13.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.130.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.130.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.130.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.130.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.130.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.130.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.131.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.131.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.131.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.131.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.131.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.131.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.132.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.132.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.132.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.132.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.132.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.132.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.133.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.133.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.133.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.133.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.133.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.133.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.134.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.134.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.134.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.134.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.134.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.134.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.135.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.135.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.135.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.135.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.135.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.135.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.136.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.136.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.136.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.136.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.136.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.136.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.137.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.137.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.137.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.137.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.137.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.137.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.138.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.138.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.138.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.138.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.138.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.138.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.139.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.139.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.139.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.139.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.139.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.139.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.14.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.14.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.14.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.14.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.14.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.14.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.140.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.140.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.140.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.140.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.140.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.140.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.141.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.141.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.141.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.141.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.141.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.141.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.142.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.142.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.142.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.142.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.142.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.142.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.143.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.143.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.143.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.143.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.143.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.143.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.144.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.144.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.144.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.144.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.144.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.144.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.145.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.145.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.145.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.145.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.145.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.145.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.146.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.146.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.146.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.146.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.146.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.146.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.147.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.147.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.147.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.147.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.147.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.147.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.148.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.148.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.148.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.148.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.148.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.148.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.149.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.149.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.149.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.149.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.149.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.149.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.15.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.15.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.15.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.15.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.15.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.15.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.150.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.150.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.150.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.150.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.150.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.150.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.151.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.151.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.151.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.151.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.151.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.151.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.152.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.152.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.152.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.152.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.152.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.152.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.153.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.153.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.153.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.153.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.153.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.153.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.154.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.154.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.154.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.154.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.154.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.154.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.155.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.155.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.155.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.155.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.155.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.155.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.156.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.156.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.156.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.156.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.156.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.156.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.157.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.157.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.157.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.157.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.157.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.157.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.158.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.158.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.158.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.158.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.158.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.158.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.159.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.159.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.159.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.159.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.159.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.159.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.16.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.16.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.16.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.16.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.16.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.16.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.17.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.17.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.17.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.17.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.17.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.17.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.18.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.18.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.18.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.18.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.18.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.18.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.19.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.19.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.19.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.19.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.19.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.19.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.2.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.2.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.2.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.2.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.2.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.2.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.20.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.20.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.20.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.20.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.20.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.20.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.21.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.21.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.21.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.21.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.21.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.21.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.22.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.22.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.22.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.22.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.22.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.22.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.23.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.23.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.23.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.23.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.23.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.23.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.24.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.24.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.24.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.24.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.24.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.24.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.25.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.25.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.25.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.25.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.25.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.25.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.26.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.26.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.26.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.26.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.26.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.26.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.27.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.27.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.27.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.27.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.27.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.27.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.28.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.28.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.28.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.28.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.28.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.28.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.29.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.29.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.29.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.29.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.29.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.29.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.3.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.3.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.3.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.3.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.3.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.3.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.30.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.30.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.30.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.30.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.30.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.30.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.31.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.31.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.31.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.31.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.31.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.31.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.32.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.32.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.32.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.32.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.32.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.32.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.33.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.33.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.33.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.33.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.33.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.33.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.34.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.34.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.34.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.34.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.34.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.34.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.35.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.35.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.35.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.35.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.35.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.35.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.36.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.36.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.36.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.36.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.36.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.36.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.37.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.37.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.37.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.37.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.37.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.37.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.38.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.38.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.38.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.38.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.38.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.38.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.39.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.39.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.39.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.39.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.39.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.39.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.4.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.4.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.4.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.4.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.4.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.4.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.40.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.40.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.40.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.40.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.40.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.40.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.41.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.41.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.41.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.41.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.41.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.41.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.42.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.42.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.42.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.42.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.42.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.42.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.43.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.43.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.43.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.43.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.43.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.43.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.44.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.44.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.44.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.44.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.44.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.44.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.45.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.45.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.45.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.45.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.45.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.45.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.46.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.46.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.46.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.46.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.46.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.46.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.47.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.47.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.47.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.47.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.47.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.47.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.48.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.48.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.48.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.48.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.48.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.48.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.49.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.49.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.49.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.49.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.49.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.49.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.5.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.5.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.5.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.5.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.5.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.5.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.50.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.50.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.50.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.50.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.50.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.50.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.51.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.51.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.51.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.51.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.51.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.51.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.52.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.52.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.52.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.52.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.52.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.52.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.53.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.53.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.53.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.53.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.53.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.53.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.54.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.54.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.54.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.54.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.54.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.54.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.55.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.55.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.55.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.55.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.55.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.55.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.56.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.56.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.56.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.56.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.56.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.56.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.57.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.57.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.57.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.57.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.57.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.57.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.58.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.58.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.58.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.58.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.58.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.58.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.59.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.59.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.59.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.59.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.59.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.59.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.6.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.6.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.6.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.6.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.6.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.6.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.60.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.60.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.60.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.60.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.60.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.60.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.61.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.61.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.61.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.61.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.61.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.61.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.62.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.62.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.62.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.62.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.62.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.62.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.63.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.63.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.63.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.63.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.63.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.63.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.64.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.64.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.64.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.64.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.64.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.64.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.65.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.65.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.65.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.65.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.65.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.65.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.66.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.66.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.66.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.66.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.66.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.66.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.67.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.67.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.67.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.67.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.67.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.67.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.68.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.68.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.68.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.68.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.68.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.68.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.69.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.69.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.69.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.69.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.69.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.69.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.7.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.7.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.7.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.7.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.7.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.7.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.70.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.70.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.70.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.70.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.70.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.70.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.71.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.71.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.71.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.71.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.71.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.71.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.72.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.72.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.72.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.72.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.72.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.72.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.73.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.73.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.73.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.73.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.73.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.73.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.74.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.74.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.74.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.74.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.74.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.74.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.75.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.75.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.75.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.75.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.75.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.75.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.76.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.76.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.76.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.76.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.76.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.76.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.77.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.77.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.77.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.77.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.77.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.77.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.78.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.78.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.78.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.78.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.78.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.78.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.79.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.79.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.79.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.79.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.79.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.79.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.8.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.8.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.8.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.8.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.8.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.8.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.80.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.80.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.80.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.80.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.80.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.80.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.81.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.81.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.81.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.81.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.81.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.81.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.82.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.82.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.82.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.82.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.82.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.82.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.83.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.83.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.83.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.83.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.83.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.83.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.84.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.84.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.84.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.84.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.84.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.84.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.85.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.85.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.85.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.85.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.85.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.85.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.86.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.86.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.86.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.86.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.86.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.86.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.87.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.87.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.87.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.87.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.87.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.87.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.88.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.88.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.88.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.88.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.88.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.88.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.89.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.89.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.89.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.89.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.89.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.89.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.9.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.9.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.9.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.9.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.9.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.9.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.90.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.90.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.90.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.90.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.90.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.90.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.91.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.91.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.91.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.91.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.91.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.91.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.92.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.92.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.92.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.92.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.92.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.92.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.93.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.93.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.93.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.93.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.93.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.93.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.94.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.94.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.94.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.94.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.94.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.94.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.95.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.95.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.95.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.95.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.95.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.95.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.96.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.96.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.96.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.96.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.96.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.96.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.97.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.97.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.97.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.97.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.97.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.97.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.98.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.98.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.98.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.98.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.98.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.98.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.99.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.99.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.99.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.99.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.99.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.experts.99.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.gate.e_score_correction_bias": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.gate.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.shared_experts.down_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.shared_experts.down_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.shared_experts.gate_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.shared_experts.gate_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.shared_experts.up_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.mlp.shared_experts.up_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.post_attention_layernorm.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.self_attn.k_norm.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.self_attn.k_proj.bias": "model-00018-of-00092.safetensors",
+ "model.layers.17.self_attn.k_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.self_attn.k_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.self_attn.o_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.self_attn.o_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.self_attn.q_norm.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.self_attn.q_proj.bias": "model-00018-of-00092.safetensors",
+ "model.layers.17.self_attn.q_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.self_attn.q_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.17.self_attn.v_proj.bias": "model-00018-of-00092.safetensors",
+ "model.layers.17.self_attn.v_proj.weight": "model-00018-of-00092.safetensors",
+ "model.layers.17.self_attn.v_proj.weight_scale": "model-00018-of-00092.safetensors",
+ "model.layers.18.input_layernorm.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.0.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.0.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.0.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.0.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.0.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.0.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.1.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.1.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.1.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.1.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.1.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.1.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.10.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.10.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.10.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.10.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.10.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.10.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.100.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.100.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.100.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.100.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.100.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.100.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.101.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.101.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.101.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.101.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.101.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.101.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.102.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.102.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.102.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.102.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.102.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.102.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.103.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.103.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.103.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.103.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.103.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.103.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.104.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.104.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.104.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.104.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.104.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.104.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.105.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.105.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.105.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.105.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.105.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.105.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.106.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.106.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.106.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.106.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.106.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.106.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.107.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.107.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.107.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.107.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.107.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.107.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.108.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.108.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.108.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.108.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.108.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.108.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.109.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.109.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.109.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.109.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.109.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.109.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.11.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.11.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.11.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.11.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.11.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.11.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.110.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.110.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.110.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.110.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.110.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.110.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.111.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.111.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.111.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.111.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.111.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.111.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.112.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.112.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.112.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.112.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.112.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.112.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.113.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.113.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.113.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.113.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.113.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.113.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.114.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.114.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.114.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.114.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.114.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.114.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.115.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.115.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.115.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.115.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.115.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.115.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.116.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.116.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.116.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.116.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.116.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.116.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.117.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.117.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.117.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.117.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.117.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.117.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.118.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.118.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.118.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.118.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.118.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.118.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.119.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.119.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.119.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.119.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.119.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.119.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.12.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.12.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.12.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.12.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.12.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.12.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.120.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.120.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.120.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.120.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.120.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.120.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.121.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.121.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.121.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.121.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.121.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.121.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.122.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.122.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.122.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.122.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.122.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.122.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.123.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.123.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.123.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.123.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.123.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.123.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.124.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.124.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.124.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.124.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.124.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.124.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.125.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.125.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.125.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.125.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.125.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.125.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.126.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.126.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.126.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.126.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.126.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.126.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.127.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.127.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.127.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.127.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.127.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.127.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.128.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.128.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.128.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.128.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.128.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.128.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.129.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.129.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.129.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.129.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.129.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.129.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.13.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.13.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.13.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.13.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.13.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.13.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.130.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.130.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.130.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.130.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.130.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.130.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.131.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.131.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.131.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.131.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.131.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.131.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.132.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.132.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.132.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.132.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.132.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.132.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.133.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.133.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.133.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.133.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.133.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.133.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.134.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.134.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.134.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.134.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.134.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.134.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.135.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.135.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.135.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.135.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.135.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.135.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.136.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.136.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.136.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.136.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.136.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.136.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.137.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.137.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.137.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.137.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.137.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.137.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.138.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.138.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.138.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.138.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.138.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.138.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.139.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.139.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.139.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.139.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.139.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.139.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.14.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.14.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.14.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.14.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.14.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.14.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.140.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.140.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.140.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.140.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.140.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.140.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.141.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.141.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.141.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.141.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.141.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.141.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.142.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.142.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.142.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.142.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.142.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.142.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.143.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.143.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.143.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.143.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.143.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.143.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.144.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.144.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.144.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.144.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.144.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.144.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.145.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.145.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.145.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.145.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.145.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.145.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.146.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.146.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.146.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.146.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.146.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.146.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.147.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.147.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.147.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.147.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.147.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.147.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.148.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.148.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.148.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.148.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.148.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.148.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.149.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.149.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.149.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.149.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.149.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.149.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.15.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.15.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.15.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.15.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.15.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.15.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.150.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.150.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.150.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.150.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.150.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.150.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.151.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.151.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.151.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.151.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.151.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.151.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.152.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.152.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.152.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.152.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.152.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.152.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.153.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.153.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.153.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.153.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.153.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.153.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.154.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.154.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.154.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.154.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.154.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.154.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.155.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.155.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.155.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.155.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.155.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.155.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.156.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.156.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.156.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.156.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.156.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.156.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.157.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.157.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.157.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.157.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.157.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.157.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.158.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.158.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.158.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.158.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.158.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.158.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.159.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.159.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.159.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.159.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.159.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.159.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.16.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.16.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.16.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.16.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.16.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.16.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.17.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.17.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.17.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.17.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.17.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.17.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.18.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.18.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.18.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.18.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.18.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.18.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.19.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.19.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.19.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.19.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.19.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.19.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.2.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.2.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.2.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.2.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.2.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.2.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.20.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.20.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.20.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.20.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.20.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.20.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.21.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.21.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.21.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.21.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.21.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.21.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.22.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.22.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.22.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.22.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.22.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.22.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.23.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.23.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.23.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.23.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.23.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.23.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.24.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.24.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.24.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.24.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.24.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.24.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.25.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.25.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.25.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.25.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.25.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.25.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.26.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.26.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.26.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.26.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.26.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.26.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.27.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.27.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.27.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.27.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.27.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.27.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.28.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.28.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.28.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.28.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.28.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.28.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.29.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.29.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.29.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.29.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.29.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.29.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.3.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.3.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.3.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.3.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.3.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.3.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.30.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.30.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.30.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.30.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.30.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.30.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.31.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.31.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.31.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.31.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.31.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.31.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.32.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.32.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.32.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.32.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.32.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.32.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.33.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.33.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.33.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.33.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.33.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.33.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.34.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.34.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.34.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.34.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.34.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.34.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.35.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.35.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.35.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.35.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.35.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.35.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.36.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.36.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.36.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.36.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.36.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.36.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.37.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.37.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.37.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.37.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.37.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.37.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.38.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.38.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.38.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.38.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.38.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.38.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.39.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.39.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.39.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.39.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.39.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.39.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.4.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.4.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.4.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.4.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.4.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.4.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.40.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.40.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.40.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.40.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.40.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.40.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.41.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.41.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.41.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.41.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.41.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.41.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.42.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.42.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.42.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.42.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.42.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.42.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.43.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.43.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.43.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.43.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.43.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.43.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.44.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.44.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.44.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.44.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.44.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.44.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.45.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.45.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.45.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.45.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.45.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.45.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.46.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.46.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.46.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.46.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.46.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.46.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.47.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.47.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.47.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.47.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.47.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.47.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.48.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.48.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.48.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.48.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.48.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.48.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.49.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.49.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.49.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.49.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.49.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.49.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.5.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.5.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.5.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.5.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.5.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.5.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.50.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.50.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.50.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.50.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.50.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.50.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.51.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.51.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.51.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.51.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.51.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.51.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.52.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.52.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.52.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.52.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.52.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.52.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.53.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.53.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.53.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.53.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.53.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.53.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.54.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.54.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.54.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.54.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.54.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.54.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.55.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.55.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.55.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.55.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.55.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.55.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.56.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.56.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.56.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.56.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.56.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.56.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.57.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.57.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.57.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.57.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.57.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.57.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.58.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.58.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.58.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.58.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.58.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.58.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.59.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.59.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.59.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.59.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.59.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.59.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.6.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.6.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.6.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.6.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.6.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.6.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.60.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.60.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.60.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.60.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.60.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.60.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.61.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.61.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.61.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.61.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.61.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.61.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.62.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.62.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.62.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.62.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.62.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.62.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.63.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.63.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.63.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.63.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.63.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.63.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.64.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.64.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.64.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.64.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.64.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.64.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.65.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.65.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.65.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.65.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.65.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.65.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.66.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.66.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.66.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.66.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.66.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.66.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.67.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.67.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.67.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.67.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.67.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.67.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.68.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.68.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.68.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.68.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.68.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.68.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.69.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.69.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.69.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.69.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.69.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.69.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.7.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.7.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.7.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.7.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.7.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.7.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.70.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.70.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.70.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.70.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.70.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.70.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.71.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.71.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.71.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.71.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.71.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.71.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.72.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.72.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.72.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.72.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.72.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.72.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.73.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.73.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.73.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.73.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.73.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.73.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.74.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.74.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.74.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.74.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.74.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.74.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.75.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.75.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.75.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.75.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.75.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.75.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.76.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.76.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.76.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.76.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.76.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.76.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.77.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.77.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.77.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.77.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.77.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.77.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.78.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.78.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.78.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.78.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.78.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.78.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.79.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.79.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.79.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.79.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.79.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.79.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.8.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.8.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.8.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.8.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.8.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.8.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.80.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.80.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.80.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.80.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.80.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.80.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.81.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.81.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.81.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.81.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.81.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.81.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.82.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.82.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.82.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.82.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.82.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.82.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.83.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.83.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.83.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.83.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.83.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.83.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.84.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.84.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.84.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.84.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.84.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.84.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.85.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.85.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.85.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.85.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.85.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.85.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.86.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.86.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.86.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.86.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.86.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.86.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.87.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.87.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.87.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.87.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.87.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.87.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.88.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.88.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.88.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.88.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.88.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.88.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.89.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.89.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.89.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.89.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.89.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.89.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.9.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.9.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.9.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.9.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.9.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.9.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.90.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.90.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.90.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.90.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.90.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.90.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.91.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.91.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.91.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.91.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.91.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.91.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.92.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.92.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.92.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.92.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.92.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.92.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.93.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.93.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.93.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.93.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.93.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.93.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.94.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.94.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.94.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.94.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.94.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.94.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.95.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.95.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.95.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.95.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.95.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.95.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.96.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.96.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.96.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.96.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.96.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.96.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.97.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.97.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.97.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.97.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.97.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.97.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.98.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.98.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.98.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.98.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.98.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.98.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.99.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.99.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.99.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.99.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.99.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.experts.99.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.gate.e_score_correction_bias": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.gate.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.shared_experts.down_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.shared_experts.down_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.shared_experts.gate_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.shared_experts.gate_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.shared_experts.up_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.mlp.shared_experts.up_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.post_attention_layernorm.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.self_attn.k_norm.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.self_attn.k_proj.bias": "model-00019-of-00092.safetensors",
+ "model.layers.18.self_attn.k_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.self_attn.k_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.self_attn.o_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.self_attn.o_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.self_attn.q_norm.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.self_attn.q_proj.bias": "model-00019-of-00092.safetensors",
+ "model.layers.18.self_attn.q_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.self_attn.q_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.18.self_attn.v_proj.bias": "model-00019-of-00092.safetensors",
+ "model.layers.18.self_attn.v_proj.weight": "model-00019-of-00092.safetensors",
+ "model.layers.18.self_attn.v_proj.weight_scale": "model-00019-of-00092.safetensors",
+ "model.layers.19.input_layernorm.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.0.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.0.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.0.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.0.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.0.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.0.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.1.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.1.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.1.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.1.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.1.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.1.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.10.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.10.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.10.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.10.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.10.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.10.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.100.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.100.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.100.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.100.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.100.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.100.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.101.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.101.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.101.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.101.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.101.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.101.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.102.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.102.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.102.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.102.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.102.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.102.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.103.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.103.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.103.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.103.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.103.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.103.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.104.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.104.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.104.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.104.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.104.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.104.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.105.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.105.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.105.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.105.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.105.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.105.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.106.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.106.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.106.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.106.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.106.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.106.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.107.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.107.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.107.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.107.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.107.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.107.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.108.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.108.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.108.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.108.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.108.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.108.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.109.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.109.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.109.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.109.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.109.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.109.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.11.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.11.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.11.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.11.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.11.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.11.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.110.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.110.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.110.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.110.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.110.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.110.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.111.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.111.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.111.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.111.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.111.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.111.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.112.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.112.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.112.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.112.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.112.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.112.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.113.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.113.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.113.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.113.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.113.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.113.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.114.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.114.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.114.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.114.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.114.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.114.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.115.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.115.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.115.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.115.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.115.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.115.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.116.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.116.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.116.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.116.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.116.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.116.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.117.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.117.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.117.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.117.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.117.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.117.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.118.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.118.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.118.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.118.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.118.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.118.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.119.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.119.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.119.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.119.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.119.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.119.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.12.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.12.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.12.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.12.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.12.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.12.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.120.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.120.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.120.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.120.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.120.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.120.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.121.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.121.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.121.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.121.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.121.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.121.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.122.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.122.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.122.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.122.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.122.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.122.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.123.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.123.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.123.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.123.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.123.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.123.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.124.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.124.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.124.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.124.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.124.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.124.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.125.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.125.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.125.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.125.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.125.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.125.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.126.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.126.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.126.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.126.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.126.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.126.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.127.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.127.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.127.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.127.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.127.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.127.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.128.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.128.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.128.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.128.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.128.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.128.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.129.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.129.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.129.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.129.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.129.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.129.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.13.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.13.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.13.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.13.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.13.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.13.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.130.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.130.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.130.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.130.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.130.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.130.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.131.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.131.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.131.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.131.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.131.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.131.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.132.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.132.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.132.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.132.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.132.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.132.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.133.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.133.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.133.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.133.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.133.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.133.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.134.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.134.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.134.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.134.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.134.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.134.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.135.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.135.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.135.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.135.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.135.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.135.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.136.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.136.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.136.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.136.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.136.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.136.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.137.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.137.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.137.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.137.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.137.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.137.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.138.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.138.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.138.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.138.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.138.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.138.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.139.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.139.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.139.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.139.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.139.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.139.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.14.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.14.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.14.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.14.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.14.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.14.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.140.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.140.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.140.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.140.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.140.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.140.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.141.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.141.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.141.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.141.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.141.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.141.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.142.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.142.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.142.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.142.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.142.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.142.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.143.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.143.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.143.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.143.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.143.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.143.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.144.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.144.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.144.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.144.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.144.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.144.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.145.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.145.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.145.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.145.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.145.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.145.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.146.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.146.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.146.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.146.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.146.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.146.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.147.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.147.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.147.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.147.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.147.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.147.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.148.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.148.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.148.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.148.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.148.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.148.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.149.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.149.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.149.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.149.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.149.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.149.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.15.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.15.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.15.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.15.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.15.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.15.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.150.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.150.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.150.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.150.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.150.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.150.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.151.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.151.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.151.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.151.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.151.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.151.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.152.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.152.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.152.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.152.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.152.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.152.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.153.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.153.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.153.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.153.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.153.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.153.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.154.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.154.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.154.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.154.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.154.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.154.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.155.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.155.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.155.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.155.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.155.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.155.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.156.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.156.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.156.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.156.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.156.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.156.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.157.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.157.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.157.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.157.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.157.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.157.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.158.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.158.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.158.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.158.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.158.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.158.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.159.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.159.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.159.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.159.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.159.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.159.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.16.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.16.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.16.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.16.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.16.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.16.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.17.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.17.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.17.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.17.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.17.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.17.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.18.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.18.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.18.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.18.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.18.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.18.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.19.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.19.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.19.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.19.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.19.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.19.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.2.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.2.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.2.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.2.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.2.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.2.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.20.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.20.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.20.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.20.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.20.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.20.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.21.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.21.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.21.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.21.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.21.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.21.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.22.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.22.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.22.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.22.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.22.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.22.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.23.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.23.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.23.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.23.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.23.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.23.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.24.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.24.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.24.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.24.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.24.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.24.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.25.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.25.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.25.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.25.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.25.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.25.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.26.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.26.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.26.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.26.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.26.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.26.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.27.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.27.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.27.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.27.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.27.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.27.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.28.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.28.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.28.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.28.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.28.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.28.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.29.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.29.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.29.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.29.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.29.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.29.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.3.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.3.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.3.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.3.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.3.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.3.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.30.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.30.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.30.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.30.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.30.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.30.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.31.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.31.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.31.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.31.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.31.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.31.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.32.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.32.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.32.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.32.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.32.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.32.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.33.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.33.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.33.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.33.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.33.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.33.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.34.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.34.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.34.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.34.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.34.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.34.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.35.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.35.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.35.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.35.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.35.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.35.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.36.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.36.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.36.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.36.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.36.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.36.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.37.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.37.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.37.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.37.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.37.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.37.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.38.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.38.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.38.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.38.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.38.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.38.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.39.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.39.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.39.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.39.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.39.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.39.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.4.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.4.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.4.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.4.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.4.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.4.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.40.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.40.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.40.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.40.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.40.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.40.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.41.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.41.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.41.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.41.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.41.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.41.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.42.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.42.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.42.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.42.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.42.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.42.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.43.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.43.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.43.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.43.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.43.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.43.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.44.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.44.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.44.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.44.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.44.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.44.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.45.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.45.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.45.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.45.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.45.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.45.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.46.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.46.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.46.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.46.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.46.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.46.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.47.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.47.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.47.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.47.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.47.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.47.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.48.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.48.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.48.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.48.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.48.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.48.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.49.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.49.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.49.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.49.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.49.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.49.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.5.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.5.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.5.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.5.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.5.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.5.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.50.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.50.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.50.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.50.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.50.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.50.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.51.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.51.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.51.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.51.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.51.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.51.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.52.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.52.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.52.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.52.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.52.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.52.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.53.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.53.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.53.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.53.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.53.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.53.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.54.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.54.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.54.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.54.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.54.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.54.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.55.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.55.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.55.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.55.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.55.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.55.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.56.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.56.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.56.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.56.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.56.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.56.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.57.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.57.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.57.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.57.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.57.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.57.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.58.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.58.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.58.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.58.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.58.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.58.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.59.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.59.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.59.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.59.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.59.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.59.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.6.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.6.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.6.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.6.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.6.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.6.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.60.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.60.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.60.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.60.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.60.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.60.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.61.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.61.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.61.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.61.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.61.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.61.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.62.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.62.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.62.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.62.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.62.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.62.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.63.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.63.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.63.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.63.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.63.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.63.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.64.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.64.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.64.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.64.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.64.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.64.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.65.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.65.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.65.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.65.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.65.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.65.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.66.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.66.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.66.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.66.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.66.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.66.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.67.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.67.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.67.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.67.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.67.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.67.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.68.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.68.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.68.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.68.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.68.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.68.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.69.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.69.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.69.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.69.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.69.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.69.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.7.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.7.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.7.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.7.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.7.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.7.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.70.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.70.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.70.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.70.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.70.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.70.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.71.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.71.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.71.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.71.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.71.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.71.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.72.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.72.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.72.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.72.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.72.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.72.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.73.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.73.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.73.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.73.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.73.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.73.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.74.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.74.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.74.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.74.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.74.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.74.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.75.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.75.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.75.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.75.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.75.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.75.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.76.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.76.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.76.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.76.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.76.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.76.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.77.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.77.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.77.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.77.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.77.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.77.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.78.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.78.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.78.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.78.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.78.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.78.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.79.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.79.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.79.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.79.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.79.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.79.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.8.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.8.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.8.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.8.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.8.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.8.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.80.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.80.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.80.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.80.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.80.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.80.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.81.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.81.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.81.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.81.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.81.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.81.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.82.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.82.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.82.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.82.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.82.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.82.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.83.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.83.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.83.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.83.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.83.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.83.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.84.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.84.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.84.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.84.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.84.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.84.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.85.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.85.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.85.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.85.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.85.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.85.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.86.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.86.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.86.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.86.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.86.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.86.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.87.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.87.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.87.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.87.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.87.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.87.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.88.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.88.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.88.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.88.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.88.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.88.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.89.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.89.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.89.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.89.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.89.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.89.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.9.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.9.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.9.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.9.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.9.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.9.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.90.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.90.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.90.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.90.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.90.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.90.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.91.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.91.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.91.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.91.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.91.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.91.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.92.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.92.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.92.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.92.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.92.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.92.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.93.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.93.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.93.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.93.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.93.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.93.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.94.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.94.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.94.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.94.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.94.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.94.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.95.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.95.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.95.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.95.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.95.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.95.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.96.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.96.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.96.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.96.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.96.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.96.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.97.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.97.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.97.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.97.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.97.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.97.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.98.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.98.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.98.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.98.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.98.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.98.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.99.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.99.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.99.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.99.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.99.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.experts.99.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.gate.e_score_correction_bias": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.gate.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.shared_experts.down_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.shared_experts.down_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.shared_experts.gate_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.shared_experts.gate_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.shared_experts.up_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.mlp.shared_experts.up_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.post_attention_layernorm.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.self_attn.k_norm.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.self_attn.k_proj.bias": "model-00020-of-00092.safetensors",
+ "model.layers.19.self_attn.k_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.self_attn.k_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.self_attn.o_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.self_attn.o_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.self_attn.q_norm.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.self_attn.q_proj.bias": "model-00020-of-00092.safetensors",
+ "model.layers.19.self_attn.q_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.self_attn.q_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.19.self_attn.v_proj.bias": "model-00020-of-00092.safetensors",
+ "model.layers.19.self_attn.v_proj.weight": "model-00020-of-00092.safetensors",
+ "model.layers.19.self_attn.v_proj.weight_scale": "model-00020-of-00092.safetensors",
+ "model.layers.2.input_layernorm.weight": "model-00003-of-00092.safetensors",
+ "model.layers.2.mlp.down_proj.weight": "model-00003-of-00092.safetensors",
+ "model.layers.2.mlp.down_proj.weight_scale": "model-00003-of-00092.safetensors",
+ "model.layers.2.mlp.gate_proj.weight": "model-00003-of-00092.safetensors",
+ "model.layers.2.mlp.gate_proj.weight_scale": "model-00003-of-00092.safetensors",
+ "model.layers.2.mlp.up_proj.weight": "model-00003-of-00092.safetensors",
+ "model.layers.2.mlp.up_proj.weight_scale": "model-00003-of-00092.safetensors",
+ "model.layers.2.post_attention_layernorm.weight": "model-00003-of-00092.safetensors",
+ "model.layers.2.self_attn.k_norm.weight": "model-00003-of-00092.safetensors",
+ "model.layers.2.self_attn.k_proj.bias": "model-00003-of-00092.safetensors",
+ "model.layers.2.self_attn.k_proj.weight": "model-00003-of-00092.safetensors",
+ "model.layers.2.self_attn.k_proj.weight_scale": "model-00003-of-00092.safetensors",
+ "model.layers.2.self_attn.o_proj.weight": "model-00003-of-00092.safetensors",
+ "model.layers.2.self_attn.o_proj.weight_scale": "model-00003-of-00092.safetensors",
+ "model.layers.2.self_attn.q_norm.weight": "model-00003-of-00092.safetensors",
+ "model.layers.2.self_attn.q_proj.bias": "model-00003-of-00092.safetensors",
+ "model.layers.2.self_attn.q_proj.weight": "model-00003-of-00092.safetensors",
+ "model.layers.2.self_attn.q_proj.weight_scale": "model-00003-of-00092.safetensors",
+ "model.layers.2.self_attn.v_proj.bias": "model-00003-of-00092.safetensors",
+ "model.layers.2.self_attn.v_proj.weight": "model-00003-of-00092.safetensors",
+ "model.layers.2.self_attn.v_proj.weight_scale": "model-00003-of-00092.safetensors",
+ "model.layers.20.input_layernorm.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.0.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.0.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.0.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.0.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.0.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.0.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.1.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.1.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.1.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.1.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.1.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.1.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.10.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.10.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.10.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.10.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.10.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.10.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.100.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.100.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.100.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.100.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.100.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.100.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.101.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.101.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.101.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.101.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.101.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.101.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.102.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.102.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.102.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.102.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.102.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.102.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.103.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.103.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.103.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.103.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.103.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.103.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.104.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.104.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.104.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.104.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.104.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.104.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.105.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.105.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.105.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.105.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.105.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.105.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.106.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.106.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.106.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.106.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.106.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.106.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.107.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.107.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.107.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.107.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.107.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.107.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.108.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.108.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.108.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.108.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.108.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.108.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.109.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.109.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.109.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.109.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.109.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.109.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.11.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.11.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.11.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.11.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.11.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.11.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.110.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.110.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.110.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.110.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.110.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.110.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.111.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.111.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.111.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.111.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.111.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.111.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.112.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.112.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.112.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.112.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.112.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.112.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.113.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.113.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.113.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.113.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.113.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.113.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.114.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.114.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.114.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.114.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.114.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.114.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.115.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.115.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.115.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.115.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.115.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.115.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.116.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.116.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.116.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.116.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.116.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.116.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.117.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.117.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.117.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.117.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.117.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.117.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.118.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.118.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.118.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.118.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.118.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.118.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.119.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.119.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.119.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.119.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.119.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.119.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.12.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.12.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.12.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.12.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.12.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.12.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.120.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.120.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.120.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.120.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.120.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.120.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.121.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.121.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.121.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.121.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.121.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.121.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.122.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.122.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.122.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.122.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.122.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.122.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.123.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.123.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.123.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.123.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.123.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.123.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.124.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.124.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.124.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.124.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.124.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.124.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.125.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.125.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.125.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.125.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.125.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.125.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.126.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.126.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.126.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.126.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.126.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.126.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.127.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.127.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.127.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.127.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.127.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.127.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.128.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.128.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.128.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.128.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.128.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.128.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.129.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.129.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.129.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.129.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.129.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.129.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.13.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.13.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.13.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.13.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.13.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.13.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.130.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.130.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.130.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.130.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.130.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.130.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.131.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.131.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.131.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.131.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.131.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.131.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.132.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.132.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.132.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.132.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.132.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.132.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.133.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.133.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.133.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.133.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.133.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.133.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.134.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.134.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.134.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.134.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.134.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.134.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.135.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.135.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.135.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.135.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.135.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.135.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.136.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.136.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.136.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.136.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.136.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.136.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.137.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.137.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.137.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.137.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.137.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.137.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.138.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.138.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.138.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.138.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.138.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.138.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.139.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.139.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.139.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.139.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.139.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.139.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.14.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.14.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.14.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.14.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.14.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.14.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.140.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.140.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.140.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.140.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.140.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.140.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.141.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.141.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.141.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.141.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.141.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.141.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.142.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.142.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.142.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.142.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.142.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.142.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.143.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.143.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.143.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.143.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.143.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.143.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.144.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.144.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.144.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.144.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.144.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.144.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.145.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.145.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.145.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.145.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.145.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.145.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.146.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.146.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.146.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.146.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.146.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.146.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.147.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.147.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.147.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.147.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.147.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.147.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.148.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.148.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.148.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.148.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.148.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.148.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.149.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.149.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.149.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.149.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.149.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.149.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.15.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.15.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.15.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.15.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.15.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.15.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.150.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.150.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.150.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.150.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.150.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.150.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.151.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.151.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.151.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.151.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.151.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.151.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.152.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.152.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.152.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.152.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.152.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.152.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.153.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.153.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.153.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.153.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.153.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.153.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.154.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.154.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.154.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.154.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.154.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.154.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.155.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.155.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.155.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.155.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.155.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.155.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.156.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.156.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.156.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.156.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.156.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.156.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.157.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.157.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.157.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.157.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.157.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.157.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.158.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.158.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.158.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.158.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.158.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.158.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.159.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.159.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.159.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.159.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.159.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.159.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.16.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.16.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.16.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.16.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.16.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.16.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.17.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.17.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.17.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.17.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.17.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.17.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.18.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.18.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.18.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.18.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.18.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.18.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.19.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.19.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.19.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.19.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.19.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.19.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.2.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.2.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.2.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.2.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.2.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.2.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.20.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.20.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.20.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.20.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.20.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.20.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.21.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.21.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.21.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.21.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.21.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.21.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.22.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.22.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.22.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.22.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.22.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.22.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.23.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.23.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.23.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.23.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.23.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.23.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.24.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.24.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.24.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.24.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.24.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.24.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.25.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.25.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.25.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.25.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.25.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.25.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.26.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.26.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.26.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.26.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.26.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.26.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.27.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.27.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.27.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.27.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.27.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.27.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.28.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.28.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.28.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.28.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.28.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.28.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.29.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.29.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.29.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.29.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.29.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.29.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.3.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.3.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.3.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.3.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.3.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.3.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.30.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.30.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.30.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.30.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.30.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.30.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.31.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.31.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.31.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.31.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.31.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.31.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.32.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.32.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.32.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.32.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.32.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.32.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.33.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.33.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.33.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.33.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.33.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.33.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.34.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.34.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.34.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.34.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.34.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.34.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.35.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.35.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.35.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.35.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.35.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.35.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.36.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.36.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.36.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.36.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.36.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.36.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.37.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.37.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.37.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.37.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.37.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.37.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.38.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.38.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.38.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.38.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.38.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.38.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.39.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.39.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.39.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.39.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.39.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.39.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.4.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.4.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.4.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.4.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.4.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.4.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.40.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.40.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.40.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.40.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.40.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.40.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.41.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.41.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.41.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.41.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.41.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.41.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.42.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.42.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.42.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.42.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.42.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.42.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.43.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.43.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.43.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.43.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.43.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.43.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.44.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.44.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.44.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.44.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.44.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.44.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.45.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.45.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.45.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.45.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.45.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.45.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.46.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.46.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.46.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.46.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.46.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.46.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.47.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.47.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.47.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.47.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.47.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.47.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.48.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.48.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.48.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.48.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.48.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.48.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.49.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.49.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.49.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.49.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.49.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.49.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.5.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.5.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.5.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.5.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.5.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.5.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.50.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.50.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.50.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.50.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.50.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.50.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.51.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.51.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.51.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.51.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.51.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.51.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.52.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.52.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.52.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.52.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.52.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.52.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.53.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.53.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.53.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.53.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.53.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.53.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.54.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.54.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.54.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.54.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.54.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.54.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.55.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.55.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.55.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.55.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.55.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.55.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.56.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.56.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.56.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.56.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.56.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.56.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.57.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.57.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.57.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.57.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.57.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.57.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.58.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.58.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.58.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.58.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.58.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.58.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.59.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.59.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.59.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.59.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.59.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.59.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.6.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.6.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.6.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.6.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.6.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.6.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.60.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.60.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.60.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.60.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.60.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.60.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.61.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.61.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.61.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.61.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.61.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.61.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.62.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.62.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.62.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.62.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.62.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.62.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.63.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.63.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.63.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.63.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.63.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.63.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.64.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.64.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.64.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.64.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.64.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.64.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.65.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.65.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.65.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.65.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.65.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.65.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.66.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.66.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.66.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.66.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.66.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.66.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.67.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.67.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.67.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.67.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.67.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.67.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.68.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.68.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.68.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.68.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.68.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.68.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.69.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.69.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.69.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.69.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.69.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.69.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.7.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.7.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.7.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.7.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.7.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.7.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.70.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.70.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.70.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.70.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.70.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.70.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.71.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.71.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.71.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.71.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.71.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.71.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.72.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.72.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.72.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.72.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.72.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.72.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.73.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.73.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.73.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.73.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.73.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.73.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.74.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.74.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.74.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.74.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.74.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.74.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.75.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.75.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.75.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.75.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.75.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.75.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.76.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.76.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.76.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.76.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.76.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.76.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.77.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.77.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.77.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.77.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.77.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.77.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.78.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.78.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.78.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.78.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.78.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.78.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.79.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.79.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.79.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.79.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.79.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.79.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.8.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.8.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.8.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.8.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.8.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.8.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.80.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.80.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.80.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.80.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.80.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.80.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.81.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.81.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.81.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.81.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.81.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.81.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.82.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.82.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.82.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.82.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.82.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.82.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.83.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.83.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.83.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.83.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.83.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.83.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.84.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.84.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.84.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.84.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.84.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.84.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.85.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.85.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.85.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.85.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.85.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.85.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.86.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.86.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.86.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.86.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.86.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.86.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.87.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.87.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.87.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.87.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.87.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.87.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.88.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.88.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.88.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.88.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.88.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.88.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.89.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.89.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.89.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.89.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.89.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.89.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.9.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.9.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.9.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.9.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.9.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.9.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.90.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.90.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.90.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.90.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.90.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.90.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.91.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.91.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.91.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.91.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.91.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.91.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.92.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.92.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.92.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.92.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.92.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.92.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.93.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.93.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.93.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.93.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.93.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.93.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.94.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.94.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.94.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.94.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.94.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.94.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.95.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.95.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.95.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.95.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.95.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.95.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.96.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.96.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.96.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.96.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.96.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.96.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.97.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.97.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.97.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.97.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.97.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.97.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.98.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.98.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.98.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.98.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.98.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.98.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.99.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.99.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.99.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.99.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.99.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.experts.99.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.gate.e_score_correction_bias": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.gate.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.shared_experts.down_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.shared_experts.down_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.shared_experts.gate_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.shared_experts.gate_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.shared_experts.up_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.mlp.shared_experts.up_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.post_attention_layernorm.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.self_attn.k_norm.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.self_attn.k_proj.bias": "model-00021-of-00092.safetensors",
+ "model.layers.20.self_attn.k_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.self_attn.k_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.self_attn.o_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.self_attn.o_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.self_attn.q_norm.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.self_attn.q_proj.bias": "model-00021-of-00092.safetensors",
+ "model.layers.20.self_attn.q_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.self_attn.q_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.20.self_attn.v_proj.bias": "model-00021-of-00092.safetensors",
+ "model.layers.20.self_attn.v_proj.weight": "model-00021-of-00092.safetensors",
+ "model.layers.20.self_attn.v_proj.weight_scale": "model-00021-of-00092.safetensors",
+ "model.layers.21.input_layernorm.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.0.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.0.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.0.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.0.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.0.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.0.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.1.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.1.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.1.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.1.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.1.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.1.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.10.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.10.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.10.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.10.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.10.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.10.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.100.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.100.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.100.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.100.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.100.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.100.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.101.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.101.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.101.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.101.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.101.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.101.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.102.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.102.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.102.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.102.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.102.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.102.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.103.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.103.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.103.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.103.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.103.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.103.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.104.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.104.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.104.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.104.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.104.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.104.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.105.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.105.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.105.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.105.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.105.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.105.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.106.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.106.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.106.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.106.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.106.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.106.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.107.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.107.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.107.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.107.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.107.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.107.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.108.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.108.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.108.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.108.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.108.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.108.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.109.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.109.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.109.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.109.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.109.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.109.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.11.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.11.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.11.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.11.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.11.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.11.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.110.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.110.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.110.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.110.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.110.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.110.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.111.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.111.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.111.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.111.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.111.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.111.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.112.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.112.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.112.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.112.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.112.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.112.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.113.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.113.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.113.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.113.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.113.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.113.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.114.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.114.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.114.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.114.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.114.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.114.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.115.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.115.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.115.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.115.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.115.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.115.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.116.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.116.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.116.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.116.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.116.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.116.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.117.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.117.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.117.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.117.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.117.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.117.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.118.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.118.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.118.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.118.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.118.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.118.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.119.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.119.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.119.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.119.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.119.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.119.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.12.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.12.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.12.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.12.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.12.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.12.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.120.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.120.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.120.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.120.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.120.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.120.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.121.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.121.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.121.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.121.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.121.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.121.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.122.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.122.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.122.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.122.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.122.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.122.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.123.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.123.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.123.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.123.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.123.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.123.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.124.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.124.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.124.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.124.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.124.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.124.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.125.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.125.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.125.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.125.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.125.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.125.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.126.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.126.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.126.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.126.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.126.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.126.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.127.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.127.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.127.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.127.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.127.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.127.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.128.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.128.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.128.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.128.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.128.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.128.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.129.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.129.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.129.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.129.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.129.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.129.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.13.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.13.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.13.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.13.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.13.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.13.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.130.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.130.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.130.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.130.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.130.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.130.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.131.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.131.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.131.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.131.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.131.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.131.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.132.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.132.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.132.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.132.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.132.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.132.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.133.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.133.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.133.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.133.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.133.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.133.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.134.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.134.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.134.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.134.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.134.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.134.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.135.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.135.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.135.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.135.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.135.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.135.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.136.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.136.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.136.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.136.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.136.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.136.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.137.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.137.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.137.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.137.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.137.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.137.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.138.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.138.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.138.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.138.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.138.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.138.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.139.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.139.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.139.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.139.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.139.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.139.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.14.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.14.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.14.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.14.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.14.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.14.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.140.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.140.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.140.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.140.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.140.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.140.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.141.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.141.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.141.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.141.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.141.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.141.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.142.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.142.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.142.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.142.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.142.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.142.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.143.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.143.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.143.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.143.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.143.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.143.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.144.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.144.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.144.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.144.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.144.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.144.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.145.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.145.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.145.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.145.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.145.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.145.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.146.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.146.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.146.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.146.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.146.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.146.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.147.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.147.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.147.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.147.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.147.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.147.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.148.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.148.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.148.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.148.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.148.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.148.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.149.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.149.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.149.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.149.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.149.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.149.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.15.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.15.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.15.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.15.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.15.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.15.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.150.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.150.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.150.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.150.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.150.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.150.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.151.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.151.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.151.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.151.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.151.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.151.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.152.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.152.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.152.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.152.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.152.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.152.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.153.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.153.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.153.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.153.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.153.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.153.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.154.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.154.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.154.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.154.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.154.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.154.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.155.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.155.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.155.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.155.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.155.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.155.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.156.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.156.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.156.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.156.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.156.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.156.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.157.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.157.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.157.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.157.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.157.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.157.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.158.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.158.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.158.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.158.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.158.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.158.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.159.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.159.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.159.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.159.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.159.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.159.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.16.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.16.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.16.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.16.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.16.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.16.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.17.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.17.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.17.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.17.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.17.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.17.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.18.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.18.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.18.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.18.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.18.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.18.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.19.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.19.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.19.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.19.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.19.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.19.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.2.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.2.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.2.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.2.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.2.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.2.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.20.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.20.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.20.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.20.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.20.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.20.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.21.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.21.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.21.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.21.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.21.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.21.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.22.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.22.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.22.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.22.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.22.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.22.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.23.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.23.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.23.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.23.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.23.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.23.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.24.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.24.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.24.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.24.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.24.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.24.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.25.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.25.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.25.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.25.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.25.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.25.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.26.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.26.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.26.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.26.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.26.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.26.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.27.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.27.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.27.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.27.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.27.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.27.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.28.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.28.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.28.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.28.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.28.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.28.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.29.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.29.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.29.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.29.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.29.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.29.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.3.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.3.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.3.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.3.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.3.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.3.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.30.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.30.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.30.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.30.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.30.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.30.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.31.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.31.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.31.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.31.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.31.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.31.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.32.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.32.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.32.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.32.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.32.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.32.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.33.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.33.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.33.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.33.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.33.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.33.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.34.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.34.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.34.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.34.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.34.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.34.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.35.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.35.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.35.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.35.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.35.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.35.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.36.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.36.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.36.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.36.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.36.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.36.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.37.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.37.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.37.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.37.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.37.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.37.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.38.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.38.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.38.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.38.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.38.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.38.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.39.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.39.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.39.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.39.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.39.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.39.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.4.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.4.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.4.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.4.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.4.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.4.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.40.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.40.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.40.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.40.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.40.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.40.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.41.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.41.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.41.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.41.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.41.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.41.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.42.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.42.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.42.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.42.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.42.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.42.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.43.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.43.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.43.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.43.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.43.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.43.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.44.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.44.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.44.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.44.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.44.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.44.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.45.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.45.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.45.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.45.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.45.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.45.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.46.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.46.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.46.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.46.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.46.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.46.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.47.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.47.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.47.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.47.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.47.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.47.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.48.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.48.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.48.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.48.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.48.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.48.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.49.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.49.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.49.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.49.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.49.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.49.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.5.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.5.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.5.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.5.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.5.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.5.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.50.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.50.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.50.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.50.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.50.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.50.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.51.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.51.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.51.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.51.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.51.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.51.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.52.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.52.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.52.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.52.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.52.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.52.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.53.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.53.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.53.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.53.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.53.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.53.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.54.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.54.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.54.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.54.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.54.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.54.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.55.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.55.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.55.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.55.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.55.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.55.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.56.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.56.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.56.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.56.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.56.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.56.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.57.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.57.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.57.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.57.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.57.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.57.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.58.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.58.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.58.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.58.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.58.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.58.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.59.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.59.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.59.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.59.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.59.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.59.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.6.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.6.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.6.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.6.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.6.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.6.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.60.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.60.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.60.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.60.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.60.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.60.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.61.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.61.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.61.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.61.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.61.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.61.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.62.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.62.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.62.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.62.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.62.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.62.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.63.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.63.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.63.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.63.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.63.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.63.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.64.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.64.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.64.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.64.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.64.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.64.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.65.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.65.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.65.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.65.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.65.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.65.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.66.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.66.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.66.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.66.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.66.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.66.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.67.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.67.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.67.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.67.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.67.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.67.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.68.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.68.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.68.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.68.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.68.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.68.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.69.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.69.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.69.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.69.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.69.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.69.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.7.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.7.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.7.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.7.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.7.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.7.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.70.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.70.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.70.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.70.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.70.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.70.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.71.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.71.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.71.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.71.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.71.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.71.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.72.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.72.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.72.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.72.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.72.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.72.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.73.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.73.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.73.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.73.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.73.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.73.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.74.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.74.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.74.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.74.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.74.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.74.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.75.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.75.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.75.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.75.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.75.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.75.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.76.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.76.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.76.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.76.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.76.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.76.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.77.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.77.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.77.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.77.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.77.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.77.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.78.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.78.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.78.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.78.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.78.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.78.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.79.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.79.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.79.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.79.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.79.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.79.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.8.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.8.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.8.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.8.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.8.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.8.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.80.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.80.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.80.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.80.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.80.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.80.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.81.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.81.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.81.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.81.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.81.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.81.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.82.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.82.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.82.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.82.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.82.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.82.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.83.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.83.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.83.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.83.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.83.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.83.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.84.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.84.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.84.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.84.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.84.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.84.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.85.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.85.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.85.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.85.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.85.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.85.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.86.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.86.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.86.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.86.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.86.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.86.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.87.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.87.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.87.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.87.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.87.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.87.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.88.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.88.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.88.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.88.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.88.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.88.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.89.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.89.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.89.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.89.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.89.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.89.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.9.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.9.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.9.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.9.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.9.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.9.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.90.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.90.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.90.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.90.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.90.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.90.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.91.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.91.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.91.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.91.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.91.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.91.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.92.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.92.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.92.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.92.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.92.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.92.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.93.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.93.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.93.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.93.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.93.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.93.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.94.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.94.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.94.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.94.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.94.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.94.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.95.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.95.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.95.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.95.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.95.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.95.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.96.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.96.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.96.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.96.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.96.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.96.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.97.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.97.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.97.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.97.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.97.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.97.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.98.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.98.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.98.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.98.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.98.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.98.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.99.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.99.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.99.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.99.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.99.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.experts.99.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.gate.e_score_correction_bias": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.gate.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.shared_experts.down_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.shared_experts.down_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.shared_experts.gate_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.shared_experts.gate_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.shared_experts.up_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.mlp.shared_experts.up_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.post_attention_layernorm.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.self_attn.k_norm.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.self_attn.k_proj.bias": "model-00022-of-00092.safetensors",
+ "model.layers.21.self_attn.k_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.self_attn.k_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.self_attn.o_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.self_attn.o_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.self_attn.q_norm.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.self_attn.q_proj.bias": "model-00022-of-00092.safetensors",
+ "model.layers.21.self_attn.q_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.self_attn.q_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.21.self_attn.v_proj.bias": "model-00022-of-00092.safetensors",
+ "model.layers.21.self_attn.v_proj.weight": "model-00022-of-00092.safetensors",
+ "model.layers.21.self_attn.v_proj.weight_scale": "model-00022-of-00092.safetensors",
+ "model.layers.22.input_layernorm.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.0.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.0.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.0.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.0.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.0.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.0.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.1.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.1.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.1.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.1.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.1.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.1.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.10.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.10.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.10.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.10.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.10.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.10.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.100.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.100.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.100.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.100.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.100.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.100.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.101.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.101.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.101.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.101.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.101.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.101.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.102.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.102.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.102.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.102.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.102.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.102.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.103.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.103.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.103.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.103.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.103.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.103.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.104.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.104.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.104.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.104.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.104.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.104.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.105.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.105.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.105.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.105.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.105.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.105.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.106.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.106.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.106.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.106.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.106.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.106.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.107.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.107.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.107.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.107.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.107.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.107.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.108.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.108.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.108.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.108.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.108.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.108.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.109.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.109.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.109.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.109.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.109.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.109.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.11.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.11.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.11.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.11.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.11.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.11.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.110.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.110.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.110.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.110.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.110.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.110.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.111.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.111.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.111.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.111.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.111.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.111.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.112.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.112.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.112.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.112.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.112.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.112.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.113.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.113.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.113.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.113.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.113.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.113.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.114.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.114.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.114.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.114.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.114.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.114.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.115.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.115.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.115.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.115.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.115.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.115.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.116.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.116.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.116.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.116.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.116.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.116.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.117.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.117.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.117.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.117.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.117.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.117.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.118.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.118.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.118.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.118.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.118.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.118.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.119.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.119.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.119.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.119.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.119.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.119.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.12.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.12.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.12.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.12.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.12.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.12.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.120.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.120.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.120.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.120.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.120.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.120.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.121.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.121.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.121.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.121.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.121.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.121.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.122.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.122.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.122.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.122.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.122.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.122.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.123.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.123.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.123.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.123.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.123.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.123.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.124.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.124.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.124.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.124.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.124.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.124.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.125.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.125.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.125.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.125.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.125.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.125.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.126.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.126.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.126.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.126.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.126.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.126.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.127.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.127.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.127.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.127.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.127.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.127.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.128.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.128.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.128.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.128.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.128.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.128.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.129.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.129.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.129.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.129.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.129.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.129.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.13.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.13.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.13.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.13.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.13.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.13.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.130.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.130.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.130.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.130.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.130.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.130.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.131.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.131.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.131.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.131.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.131.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.131.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.132.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.132.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.132.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.132.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.132.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.132.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.133.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.133.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.133.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.133.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.133.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.133.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.134.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.134.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.134.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.134.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.134.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.134.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.135.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.135.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.135.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.135.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.135.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.135.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.136.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.136.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.136.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.136.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.136.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.136.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.137.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.137.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.137.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.137.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.137.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.137.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.138.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.138.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.138.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.138.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.138.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.138.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.139.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.139.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.139.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.139.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.139.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.139.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.14.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.14.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.14.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.14.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.14.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.14.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.140.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.140.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.140.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.140.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.140.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.140.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.141.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.141.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.141.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.141.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.141.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.141.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.142.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.142.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.142.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.142.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.142.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.142.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.143.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.143.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.143.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.143.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.143.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.143.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.144.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.144.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.144.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.144.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.144.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.144.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.145.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.145.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.145.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.145.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.145.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.145.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.146.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.146.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.146.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.146.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.146.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.146.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.147.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.147.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.147.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.147.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.147.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.147.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.148.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.148.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.148.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.148.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.148.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.148.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.149.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.149.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.149.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.149.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.149.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.149.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.15.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.15.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.15.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.15.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.15.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.15.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.150.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.150.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.150.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.150.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.150.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.150.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.151.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.151.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.151.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.151.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.151.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.151.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.152.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.152.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.152.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.152.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.152.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.152.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.153.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.153.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.153.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.153.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.153.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.153.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.154.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.154.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.154.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.154.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.154.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.154.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.155.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.155.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.155.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.155.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.155.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.155.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.156.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.156.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.156.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.156.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.156.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.156.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.157.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.157.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.157.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.157.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.157.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.157.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.158.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.158.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.158.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.158.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.158.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.158.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.159.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.159.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.159.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.159.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.159.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.159.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.16.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.16.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.16.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.16.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.16.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.16.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.17.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.17.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.17.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.17.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.17.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.17.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.18.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.18.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.18.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.18.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.18.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.18.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.19.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.19.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.19.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.19.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.19.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.19.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.2.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.2.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.2.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.2.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.2.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.2.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.20.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.20.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.20.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.20.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.20.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.20.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.21.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.21.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.21.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.21.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.21.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.21.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.22.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.22.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.22.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.22.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.22.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.22.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.23.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.23.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.23.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.23.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.23.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.23.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.24.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.24.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.24.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.24.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.24.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.24.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.25.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.25.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.25.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.25.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.25.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.25.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.26.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.26.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.26.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.26.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.26.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.26.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.27.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.27.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.27.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.27.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.27.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.27.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.28.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.28.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.28.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.28.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.28.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.28.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.29.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.29.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.29.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.29.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.29.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.29.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.3.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.3.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.3.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.3.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.3.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.3.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.30.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.30.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.30.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.30.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.30.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.30.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.31.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.31.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.31.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.31.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.31.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.31.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.32.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.32.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.32.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.32.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.32.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.32.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.33.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.33.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.33.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.33.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.33.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.33.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.34.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.34.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.34.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.34.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.34.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.34.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.35.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.35.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.35.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.35.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.35.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.35.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.36.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.36.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.36.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.36.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.36.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.36.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.37.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.37.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.37.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.37.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.37.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.37.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.38.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.38.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.38.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.38.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.38.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.38.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.39.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.39.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.39.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.39.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.39.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.39.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.4.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.4.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.4.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.4.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.4.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.4.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.40.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.40.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.40.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.40.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.40.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.40.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.41.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.41.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.41.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.41.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.41.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.41.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.42.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.42.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.42.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.42.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.42.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.42.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.43.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.43.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.43.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.43.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.43.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.43.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.44.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.44.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.44.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.44.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.44.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.44.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.45.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.45.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.45.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.45.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.45.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.45.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.46.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.46.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.46.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.46.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.46.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.46.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.47.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.47.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.47.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.47.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.47.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.47.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.48.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.48.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.48.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.48.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.48.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.48.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.49.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.49.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.49.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.49.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.49.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.49.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.5.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.5.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.5.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.5.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.5.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.5.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.50.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.50.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.50.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.50.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.50.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.50.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.51.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.51.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.51.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.51.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.51.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.51.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.52.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.52.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.52.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.52.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.52.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.52.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.53.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.53.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.53.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.53.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.53.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.53.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.54.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.54.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.54.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.54.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.54.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.54.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.55.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.55.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.55.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.55.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.55.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.55.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.56.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.56.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.56.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.56.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.56.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.56.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.57.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.57.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.57.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.57.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.57.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.57.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.58.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.58.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.58.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.58.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.58.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.58.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.59.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.59.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.59.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.59.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.59.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.59.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.6.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.6.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.6.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.6.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.6.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.6.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.60.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.60.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.60.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.60.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.60.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.60.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.61.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.61.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.61.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.61.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.61.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.61.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.62.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.62.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.62.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.62.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.62.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.62.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.63.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.63.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.63.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.63.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.63.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.63.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.64.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.64.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.64.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.64.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.64.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.64.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.65.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.65.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.65.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.65.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.65.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.65.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.66.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.66.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.66.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.66.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.66.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.66.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.67.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.67.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.67.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.67.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.67.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.67.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.68.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.68.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.68.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.68.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.68.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.68.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.69.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.69.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.69.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.69.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.69.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.69.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.7.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.7.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.7.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.7.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.7.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.7.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.70.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.70.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.70.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.70.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.70.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.70.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.71.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.71.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.71.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.71.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.71.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.71.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.72.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.72.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.72.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.72.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.72.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.72.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.73.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.73.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.73.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.73.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.73.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.73.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.74.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.74.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.74.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.74.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.74.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.74.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.75.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.75.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.75.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.75.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.75.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.75.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.76.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.76.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.76.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.76.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.76.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.76.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.77.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.77.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.77.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.77.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.77.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.77.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.78.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.78.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.78.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.78.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.78.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.78.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.79.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.79.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.79.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.79.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.79.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.79.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.8.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.8.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.8.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.8.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.8.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.8.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.80.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.80.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.80.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.80.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.80.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.80.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.81.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.81.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.81.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.81.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.81.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.81.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.82.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.82.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.82.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.82.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.82.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.82.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.83.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.83.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.83.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.83.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.83.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.83.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.84.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.84.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.84.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.84.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.84.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.84.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.85.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.85.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.85.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.85.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.85.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.85.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.86.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.86.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.86.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.86.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.86.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.86.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.87.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.87.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.87.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.87.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.87.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.87.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.88.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.88.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.88.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.88.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.88.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.88.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.89.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.89.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.89.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.89.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.89.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.89.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.9.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.9.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.9.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.9.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.9.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.9.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.90.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.90.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.90.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.90.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.90.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.90.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.91.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.91.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.91.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.91.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.91.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.91.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.92.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.92.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.92.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.92.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.92.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.92.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.93.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.93.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.93.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.93.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.93.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.93.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.94.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.94.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.94.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.94.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.94.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.94.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.95.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.95.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.95.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.95.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.95.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.95.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.96.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.96.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.96.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.96.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.96.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.96.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.97.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.97.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.97.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.97.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.97.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.97.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.98.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.98.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.98.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.98.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.98.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.98.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.99.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.99.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.99.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.99.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.99.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.experts.99.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.gate.e_score_correction_bias": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.gate.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.shared_experts.down_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.shared_experts.down_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.shared_experts.gate_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.shared_experts.gate_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.shared_experts.up_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.mlp.shared_experts.up_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.post_attention_layernorm.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.self_attn.k_norm.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.self_attn.k_proj.bias": "model-00023-of-00092.safetensors",
+ "model.layers.22.self_attn.k_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.self_attn.k_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.self_attn.o_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.self_attn.o_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.self_attn.q_norm.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.self_attn.q_proj.bias": "model-00023-of-00092.safetensors",
+ "model.layers.22.self_attn.q_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.self_attn.q_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.22.self_attn.v_proj.bias": "model-00023-of-00092.safetensors",
+ "model.layers.22.self_attn.v_proj.weight": "model-00023-of-00092.safetensors",
+ "model.layers.22.self_attn.v_proj.weight_scale": "model-00023-of-00092.safetensors",
+ "model.layers.23.input_layernorm.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.0.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.0.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.0.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.0.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.0.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.0.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.1.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.1.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.1.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.1.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.1.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.1.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.10.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.10.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.10.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.10.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.10.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.10.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.100.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.100.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.100.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.100.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.100.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.100.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.101.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.101.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.101.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.101.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.101.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.101.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.102.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.102.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.102.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.102.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.102.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.102.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.103.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.103.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.103.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.103.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.103.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.103.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.104.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.104.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.104.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.104.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.104.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.104.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.105.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.105.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.105.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.105.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.105.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.105.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.106.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.106.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.106.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.106.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.106.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.106.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.107.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.107.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.107.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.107.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.107.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.107.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.108.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.108.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.108.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.108.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.108.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.108.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.109.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.109.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.109.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.109.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.109.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.109.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.11.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.11.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.11.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.11.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.11.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.11.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.110.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.110.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.110.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.110.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.110.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.110.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.111.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.111.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.111.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.111.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.111.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.111.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.112.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.112.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.112.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.112.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.112.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.112.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.113.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.113.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.113.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.113.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.113.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.113.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.114.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.114.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.114.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.114.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.114.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.114.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.115.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.115.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.115.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.115.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.115.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.115.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.116.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.116.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.116.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.116.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.116.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.116.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.117.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.117.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.117.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.117.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.117.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.117.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.118.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.118.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.118.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.118.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.118.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.118.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.119.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.119.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.119.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.119.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.119.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.119.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.12.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.12.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.12.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.12.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.12.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.12.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.120.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.120.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.120.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.120.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.120.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.120.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.121.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.121.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.121.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.121.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.121.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.121.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.122.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.122.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.122.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.122.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.122.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.122.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.123.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.123.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.123.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.123.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.123.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.123.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.124.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.124.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.124.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.124.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.124.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.124.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.125.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.125.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.125.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.125.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.125.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.125.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.126.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.126.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.126.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.126.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.126.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.126.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.127.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.127.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.127.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.127.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.127.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.127.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.128.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.128.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.128.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.128.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.128.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.128.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.129.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.129.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.129.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.129.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.129.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.129.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.13.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.13.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.13.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.13.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.13.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.13.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.130.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.130.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.130.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.130.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.130.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.130.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.131.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.131.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.131.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.131.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.131.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.131.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.132.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.132.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.132.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.132.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.132.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.132.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.133.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.133.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.133.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.133.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.133.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.133.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.134.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.134.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.134.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.134.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.134.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.134.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.135.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.135.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.135.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.135.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.135.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.135.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.136.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.136.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.136.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.136.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.136.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.136.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.137.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.137.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.137.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.137.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.137.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.137.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.138.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.138.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.138.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.138.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.138.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.138.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.139.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.139.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.139.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.139.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.139.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.139.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.14.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.14.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.14.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.14.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.14.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.14.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.140.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.140.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.140.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.140.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.140.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.140.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.141.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.141.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.141.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.141.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.141.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.141.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.142.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.142.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.142.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.142.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.142.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.142.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.143.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.143.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.143.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.143.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.143.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.143.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.144.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.144.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.144.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.144.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.144.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.144.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.145.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.145.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.145.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.145.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.145.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.145.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.146.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.146.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.146.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.146.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.146.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.146.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.147.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.147.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.147.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.147.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.147.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.147.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.148.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.148.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.148.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.148.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.148.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.148.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.149.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.149.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.149.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.149.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.149.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.149.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.15.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.15.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.15.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.15.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.15.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.15.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.150.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.150.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.150.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.150.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.150.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.150.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.151.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.151.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.151.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.151.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.151.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.151.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.152.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.152.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.152.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.152.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.152.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.152.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.153.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.153.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.153.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.153.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.153.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.153.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.154.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.154.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.154.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.154.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.154.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.154.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.155.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.155.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.155.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.155.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.155.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.155.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.156.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.156.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.156.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.156.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.156.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.156.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.157.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.157.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.157.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.157.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.157.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.157.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.158.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.158.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.158.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.158.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.158.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.158.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.159.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.159.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.159.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.159.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.159.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.159.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.16.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.16.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.16.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.16.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.16.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.16.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.17.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.17.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.17.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.17.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.17.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.17.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.18.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.18.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.18.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.18.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.18.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.18.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.19.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.19.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.19.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.19.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.19.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.19.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.2.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.2.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.2.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.2.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.2.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.2.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.20.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.20.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.20.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.20.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.20.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.20.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.21.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.21.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.21.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.21.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.21.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.21.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.22.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.22.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.22.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.22.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.22.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.22.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.23.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.23.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.23.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.23.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.23.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.23.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.24.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.24.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.24.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.24.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.24.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.24.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.25.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.25.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.25.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.25.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.25.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.25.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.26.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.26.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.26.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.26.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.26.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.26.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.27.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.27.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.27.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.27.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.27.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.27.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.28.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.28.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.28.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.28.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.28.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.28.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.29.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.29.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.29.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.29.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.29.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.29.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.3.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.3.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.3.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.3.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.3.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.3.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.30.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.30.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.30.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.30.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.30.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.30.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.31.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.31.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.31.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.31.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.31.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.31.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.32.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.32.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.32.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.32.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.32.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.32.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.33.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.33.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.33.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.33.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.33.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.33.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.34.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.34.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.34.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.34.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.34.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.34.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.35.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.35.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.35.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.35.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.35.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.35.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.36.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.36.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.36.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.36.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.36.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.36.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.37.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.37.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.37.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.37.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.37.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.37.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.38.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.38.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.38.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.38.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.38.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.38.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.39.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.39.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.39.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.39.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.39.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.39.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.4.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.4.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.4.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.4.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.4.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.4.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.40.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.40.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.40.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.40.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.40.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.40.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.41.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.41.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.41.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.41.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.41.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.41.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.42.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.42.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.42.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.42.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.42.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.42.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.43.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.43.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.43.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.43.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.43.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.43.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.44.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.44.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.44.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.44.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.44.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.44.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.45.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.45.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.45.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.45.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.45.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.45.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.46.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.46.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.46.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.46.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.46.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.46.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.47.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.47.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.47.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.47.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.47.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.47.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.48.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.48.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.48.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.48.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.48.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.48.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.49.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.49.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.49.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.49.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.49.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.49.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.5.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.5.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.5.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.5.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.5.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.5.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.50.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.50.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.50.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.50.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.50.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.50.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.51.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.51.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.51.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.51.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.51.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.51.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.52.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.52.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.52.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.52.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.52.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.52.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.53.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.53.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.53.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.53.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.53.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.53.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.54.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.54.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.54.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.54.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.54.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.54.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.55.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.55.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.55.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.55.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.55.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.55.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.56.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.56.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.56.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.56.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.56.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.56.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.57.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.57.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.57.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.57.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.57.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.57.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.58.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.58.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.58.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.58.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.58.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.58.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.59.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.59.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.59.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.59.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.59.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.59.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.6.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.6.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.6.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.6.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.6.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.6.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.60.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.60.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.60.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.60.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.60.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.60.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.61.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.61.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.61.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.61.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.61.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.61.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.62.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.62.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.62.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.62.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.62.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.62.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.63.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.63.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.63.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.63.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.63.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.63.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.64.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.64.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.64.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.64.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.64.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.64.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.65.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.65.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.65.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.65.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.65.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.65.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.66.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.66.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.66.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.66.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.66.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.66.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.67.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.67.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.67.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.67.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.67.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.67.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.68.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.68.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.68.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.68.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.68.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.68.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.69.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.69.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.69.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.69.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.69.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.69.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.7.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.7.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.7.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.7.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.7.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.7.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.70.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.70.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.70.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.70.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.70.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.70.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.71.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.71.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.71.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.71.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.71.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.71.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.72.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.72.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.72.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.72.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.72.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.72.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.73.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.73.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.73.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.73.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.73.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.73.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.74.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.74.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.74.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.74.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.74.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.74.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.75.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.75.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.75.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.75.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.75.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.75.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.76.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.76.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.76.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.76.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.76.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.76.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.77.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.77.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.77.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.77.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.77.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.77.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.78.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.78.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.78.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.78.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.78.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.78.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.79.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.79.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.79.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.79.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.79.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.79.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.8.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.8.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.8.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.8.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.8.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.8.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.80.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.80.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.80.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.80.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.80.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.80.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.81.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.81.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.81.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.81.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.81.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.81.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.82.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.82.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.82.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.82.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.82.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.82.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.83.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.83.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.83.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.83.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.83.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.83.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.84.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.84.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.84.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.84.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.84.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.84.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.85.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.85.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.85.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.85.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.85.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.85.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.86.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.86.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.86.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.86.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.86.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.86.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.87.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.87.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.87.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.87.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.87.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.87.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.88.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.88.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.88.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.88.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.88.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.88.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.89.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.89.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.89.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.89.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.89.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.89.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.9.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.9.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.9.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.9.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.9.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.9.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.90.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.90.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.90.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.90.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.90.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.90.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.91.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.91.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.91.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.91.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.91.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.91.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.92.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.92.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.92.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.92.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.92.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.92.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.93.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.93.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.93.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.93.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.93.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.93.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.94.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.94.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.94.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.94.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.94.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.94.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.95.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.95.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.95.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.95.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.95.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.95.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.96.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.96.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.96.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.96.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.96.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.96.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.97.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.97.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.97.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.97.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.97.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.97.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.98.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.98.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.98.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.98.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.98.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.98.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.99.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.99.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.99.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.99.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.99.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.experts.99.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.gate.e_score_correction_bias": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.gate.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.shared_experts.down_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.shared_experts.down_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.shared_experts.gate_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.shared_experts.gate_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.shared_experts.up_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.mlp.shared_experts.up_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.post_attention_layernorm.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.self_attn.k_norm.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.self_attn.k_proj.bias": "model-00024-of-00092.safetensors",
+ "model.layers.23.self_attn.k_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.self_attn.k_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.self_attn.o_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.self_attn.o_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.self_attn.q_norm.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.self_attn.q_proj.bias": "model-00024-of-00092.safetensors",
+ "model.layers.23.self_attn.q_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.self_attn.q_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.23.self_attn.v_proj.bias": "model-00024-of-00092.safetensors",
+ "model.layers.23.self_attn.v_proj.weight": "model-00024-of-00092.safetensors",
+ "model.layers.23.self_attn.v_proj.weight_scale": "model-00024-of-00092.safetensors",
+ "model.layers.24.input_layernorm.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.0.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.0.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.0.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.0.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.0.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.0.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.1.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.1.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.1.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.1.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.1.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.1.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.10.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.10.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.10.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.10.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.10.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.10.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.100.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.100.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.100.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.100.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.100.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.100.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.101.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.101.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.101.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.101.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.101.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.101.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.102.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.102.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.102.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.102.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.102.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.102.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.103.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.103.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.103.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.103.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.103.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.103.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.104.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.104.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.104.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.104.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.104.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.104.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.105.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.105.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.105.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.105.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.105.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.105.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.106.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.106.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.106.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.106.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.106.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.106.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.107.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.107.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.107.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.107.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.107.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.107.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.108.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.108.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.108.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.108.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.108.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.108.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.109.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.109.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.109.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.109.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.109.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.109.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.11.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.11.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.11.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.11.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.11.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.11.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.110.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.110.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.110.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.110.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.110.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.110.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.111.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.111.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.111.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.111.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.111.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.111.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.112.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.112.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.112.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.112.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.112.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.112.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.113.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.113.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.113.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.113.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.113.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.113.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.114.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.114.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.114.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.114.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.114.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.114.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.115.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.115.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.115.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.115.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.115.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.115.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.116.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.116.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.116.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.116.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.116.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.116.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.117.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.117.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.117.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.117.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.117.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.117.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.118.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.118.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.118.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.118.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.118.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.118.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.119.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.119.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.119.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.119.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.119.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.119.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.12.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.12.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.12.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.12.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.12.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.12.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.120.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.120.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.120.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.120.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.120.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.120.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.121.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.121.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.121.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.121.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.121.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.121.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.122.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.122.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.122.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.122.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.122.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.122.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.123.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.123.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.123.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.123.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.123.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.123.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.124.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.124.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.124.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.124.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.124.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.124.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.125.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.125.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.125.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.125.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.125.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.125.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.126.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.126.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.126.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.126.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.126.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.126.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.127.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.127.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.127.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.127.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.127.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.127.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.128.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.128.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.128.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.128.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.128.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.128.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.129.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.129.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.129.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.129.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.129.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.129.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.13.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.13.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.13.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.13.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.13.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.13.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.130.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.130.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.130.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.130.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.130.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.130.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.131.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.131.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.131.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.131.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.131.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.131.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.132.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.132.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.132.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.132.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.132.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.132.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.133.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.133.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.133.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.133.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.133.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.133.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.134.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.134.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.134.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.134.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.134.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.134.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.135.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.135.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.135.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.135.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.135.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.135.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.136.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.136.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.136.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.136.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.136.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.136.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.137.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.137.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.137.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.137.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.137.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.137.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.138.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.138.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.138.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.138.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.138.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.138.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.139.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.139.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.139.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.139.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.139.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.139.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.14.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.14.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.14.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.14.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.14.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.14.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.140.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.140.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.140.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.140.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.140.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.140.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.141.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.141.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.141.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.141.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.141.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.141.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.142.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.142.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.142.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.142.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.142.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.142.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.143.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.143.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.143.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.143.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.143.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.143.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.144.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.144.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.144.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.144.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.144.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.144.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.145.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.145.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.145.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.145.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.145.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.145.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.146.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.146.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.146.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.146.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.146.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.146.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.147.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.147.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.147.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.147.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.147.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.147.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.148.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.148.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.148.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.148.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.148.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.148.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.149.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.149.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.149.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.149.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.149.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.149.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.15.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.15.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.15.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.15.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.15.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.15.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.150.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.150.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.150.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.150.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.150.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.150.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.151.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.151.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.151.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.151.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.151.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.151.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.152.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.152.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.152.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.152.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.152.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.152.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.153.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.153.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.153.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.153.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.153.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.153.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.154.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.154.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.154.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.154.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.154.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.154.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.155.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.155.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.155.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.155.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.155.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.155.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.156.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.156.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.156.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.156.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.156.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.156.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.157.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.157.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.157.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.157.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.157.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.157.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.158.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.158.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.158.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.158.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.158.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.158.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.159.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.159.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.159.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.159.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.159.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.159.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.16.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.16.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.16.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.16.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.16.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.16.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.17.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.17.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.17.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.17.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.17.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.17.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.18.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.18.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.18.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.18.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.18.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.18.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.19.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.19.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.19.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.19.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.19.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.19.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.2.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.2.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.2.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.2.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.2.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.2.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.20.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.20.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.20.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.20.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.20.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.20.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.21.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.21.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.21.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.21.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.21.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.21.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.22.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.22.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.22.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.22.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.22.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.22.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.23.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.23.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.23.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.23.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.23.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.23.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.24.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.24.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.24.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.24.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.24.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.24.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.25.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.25.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.25.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.25.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.25.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.25.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.26.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.26.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.26.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.26.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.26.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.26.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.27.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.27.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.27.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.27.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.27.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.27.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.28.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.28.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.28.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.28.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.28.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.28.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.29.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.29.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.29.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.29.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.29.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.29.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.3.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.3.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.3.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.3.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.3.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.3.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.30.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.30.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.30.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.30.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.30.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.30.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.31.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.31.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.31.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.31.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.31.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.31.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.32.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.32.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.32.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.32.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.32.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.32.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.33.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.33.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.33.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.33.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.33.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.33.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.34.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.34.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.34.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.34.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.34.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.34.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.35.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.35.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.35.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.35.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.35.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.35.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.36.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.36.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.36.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.36.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.36.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.36.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.37.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.37.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.37.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.37.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.37.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.37.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.38.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.38.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.38.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.38.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.38.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.38.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.39.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.39.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.39.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.39.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.39.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.39.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.4.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.4.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.4.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.4.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.4.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.4.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.40.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.40.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.40.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.40.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.40.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.40.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.41.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.41.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.41.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.41.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.41.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.41.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.42.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.42.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.42.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.42.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.42.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.42.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.43.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.43.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.43.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.43.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.43.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.43.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.44.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.44.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.44.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.44.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.44.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.44.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.45.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.45.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.45.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.45.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.45.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.45.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.46.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.46.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.46.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.46.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.46.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.46.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.47.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.47.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.47.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.47.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.47.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.47.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.48.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.48.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.48.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.48.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.48.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.48.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.49.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.49.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.49.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.49.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.49.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.49.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.5.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.5.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.5.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.5.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.5.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.5.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.50.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.50.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.50.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.50.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.50.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.50.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.51.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.51.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.51.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.51.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.51.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.51.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.52.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.52.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.52.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.52.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.52.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.52.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.53.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.53.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.53.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.53.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.53.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.53.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.54.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.54.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.54.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.54.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.54.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.54.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.55.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.55.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.55.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.55.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.55.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.55.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.56.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.56.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.56.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.56.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.56.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.56.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.57.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.57.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.57.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.57.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.57.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.57.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.58.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.58.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.58.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.58.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.58.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.58.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.59.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.59.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.59.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.59.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.59.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.59.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.6.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.6.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.6.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.6.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.6.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.6.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.60.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.60.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.60.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.60.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.60.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.60.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.61.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.61.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.61.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.61.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.61.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.61.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.62.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.62.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.62.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.62.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.62.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.62.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.63.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.63.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.63.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.63.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.63.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.63.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.64.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.64.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.64.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.64.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.64.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.64.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.65.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.65.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.65.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.65.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.65.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.65.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.66.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.66.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.66.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.66.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.66.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.66.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.67.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.67.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.67.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.67.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.67.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.67.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.68.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.68.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.68.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.68.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.68.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.68.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.69.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.69.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.69.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.69.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.69.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.69.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.7.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.7.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.7.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.7.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.7.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.7.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.70.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.70.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.70.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.70.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.70.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.70.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.71.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.71.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.71.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.71.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.71.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.71.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.72.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.72.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.72.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.72.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.72.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.72.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.73.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.73.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.73.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.73.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.73.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.73.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.74.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.74.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.74.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.74.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.74.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.74.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.75.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.75.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.75.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.75.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.75.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.75.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.76.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.76.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.76.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.76.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.76.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.76.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.77.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.77.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.77.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.77.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.77.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.77.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.78.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.78.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.78.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.78.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.78.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.78.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.79.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.79.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.79.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.79.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.79.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.79.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.8.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.8.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.8.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.8.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.8.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.8.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.80.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.80.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.80.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.80.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.80.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.80.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.81.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.81.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.81.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.81.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.81.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.81.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.82.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.82.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.82.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.82.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.82.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.82.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.83.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.83.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.83.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.83.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.83.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.83.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.84.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.84.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.84.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.84.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.84.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.84.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.85.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.85.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.85.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.85.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.85.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.85.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.86.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.86.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.86.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.86.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.86.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.86.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.87.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.87.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.87.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.87.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.87.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.87.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.88.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.88.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.88.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.88.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.88.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.88.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.89.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.89.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.89.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.89.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.89.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.89.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.9.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.9.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.9.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.9.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.9.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.9.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.90.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.90.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.90.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.90.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.90.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.90.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.91.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.91.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.91.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.91.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.91.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.91.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.92.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.92.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.92.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.92.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.92.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.92.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.93.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.93.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.93.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.93.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.93.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.93.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.94.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.94.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.94.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.94.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.94.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.94.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.95.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.95.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.95.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.95.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.95.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.95.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.96.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.96.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.96.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.96.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.96.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.96.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.97.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.97.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.97.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.97.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.97.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.97.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.98.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.98.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.98.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.98.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.98.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.98.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.99.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.99.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.99.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.99.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.99.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.experts.99.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.gate.e_score_correction_bias": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.gate.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.shared_experts.down_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.shared_experts.down_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.shared_experts.gate_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.shared_experts.gate_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.shared_experts.up_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.mlp.shared_experts.up_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.post_attention_layernorm.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.self_attn.k_norm.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.self_attn.k_proj.bias": "model-00025-of-00092.safetensors",
+ "model.layers.24.self_attn.k_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.self_attn.k_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.self_attn.o_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.self_attn.o_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.self_attn.q_norm.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.self_attn.q_proj.bias": "model-00025-of-00092.safetensors",
+ "model.layers.24.self_attn.q_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.self_attn.q_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.24.self_attn.v_proj.bias": "model-00025-of-00092.safetensors",
+ "model.layers.24.self_attn.v_proj.weight": "model-00025-of-00092.safetensors",
+ "model.layers.24.self_attn.v_proj.weight_scale": "model-00025-of-00092.safetensors",
+ "model.layers.25.input_layernorm.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.0.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.0.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.0.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.0.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.0.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.0.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.1.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.1.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.1.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.1.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.1.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.1.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.10.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.10.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.10.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.10.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.10.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.10.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.100.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.100.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.100.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.100.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.100.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.100.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.101.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.101.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.101.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.101.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.101.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.101.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.102.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.102.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.102.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.102.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.102.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.102.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.103.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.103.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.103.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.103.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.103.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.103.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.104.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.104.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.104.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.104.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.104.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.104.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.105.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.105.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.105.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.105.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.105.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.105.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.106.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.106.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.106.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.106.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.106.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.106.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.107.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.107.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.107.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.107.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.107.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.107.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.108.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.108.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.108.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.108.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.108.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.108.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.109.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.109.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.109.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.109.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.109.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.109.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.11.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.11.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.11.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.11.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.11.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.11.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.110.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.110.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.110.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.110.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.110.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.110.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.111.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.111.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.111.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.111.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.111.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.111.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.112.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.112.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.112.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.112.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.112.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.112.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.113.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.113.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.113.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.113.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.113.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.113.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.114.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.114.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.114.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.114.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.114.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.114.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.115.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.115.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.115.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.115.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.115.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.115.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.116.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.116.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.116.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.116.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.116.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.116.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.117.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.117.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.117.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.117.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.117.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.117.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.118.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.118.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.118.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.118.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.118.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.118.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.119.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.119.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.119.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.119.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.119.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.119.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.12.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.12.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.12.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.12.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.12.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.12.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.120.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.120.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.120.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.120.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.120.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.120.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.121.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.121.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.121.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.121.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.121.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.121.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.122.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.122.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.122.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.122.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.122.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.122.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.123.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.123.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.123.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.123.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.123.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.123.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.124.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.124.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.124.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.124.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.124.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.124.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.125.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.125.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.125.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.125.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.125.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.125.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.126.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.126.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.126.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.126.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.126.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.126.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.127.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.127.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.127.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.127.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.127.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.127.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.128.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.128.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.128.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.128.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.128.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.128.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.129.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.129.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.129.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.129.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.129.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.129.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.13.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.13.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.13.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.13.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.13.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.13.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.130.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.130.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.130.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.130.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.130.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.130.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.131.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.131.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.131.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.131.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.131.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.131.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.132.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.132.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.132.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.132.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.132.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.132.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.133.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.133.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.133.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.133.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.133.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.133.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.134.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.134.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.134.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.134.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.134.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.134.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.135.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.135.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.135.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.135.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.135.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.135.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.136.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.136.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.136.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.136.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.136.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.136.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.137.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.137.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.137.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.137.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.137.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.137.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.138.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.138.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.138.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.138.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.138.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.138.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.139.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.139.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.139.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.139.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.139.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.139.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.14.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.14.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.14.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.14.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.14.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.14.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.140.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.140.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.140.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.140.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.140.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.140.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.141.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.141.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.141.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.141.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.141.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.141.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.142.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.142.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.142.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.142.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.142.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.142.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.143.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.143.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.143.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.143.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.143.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.143.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.144.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.144.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.144.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.144.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.144.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.144.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.145.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.145.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.145.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.145.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.145.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.145.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.146.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.146.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.146.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.146.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.146.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.146.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.147.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.147.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.147.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.147.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.147.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.147.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.148.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.148.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.148.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.148.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.148.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.148.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.149.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.149.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.149.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.149.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.149.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.149.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.15.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.15.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.15.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.15.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.15.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.15.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.150.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.150.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.150.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.150.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.150.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.150.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.151.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.151.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.151.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.151.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.151.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.151.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.152.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.152.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.152.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.152.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.152.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.152.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.153.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.153.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.153.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.153.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.153.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.153.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.154.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.154.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.154.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.154.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.154.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.154.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.155.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.155.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.155.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.155.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.155.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.155.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.156.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.156.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.156.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.156.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.156.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.156.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.157.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.157.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.157.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.157.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.157.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.157.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.158.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.158.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.158.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.158.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.158.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.158.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.159.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.159.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.159.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.159.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.159.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.159.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.16.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.16.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.16.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.16.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.16.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.16.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.17.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.17.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.17.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.17.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.17.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.17.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.18.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.18.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.18.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.18.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.18.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.18.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.19.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.19.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.19.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.19.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.19.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.19.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.2.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.2.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.2.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.2.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.2.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.2.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.20.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.20.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.20.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.20.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.20.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.20.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.21.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.21.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.21.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.21.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.21.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.21.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.22.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.22.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.22.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.22.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.22.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.22.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.23.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.23.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.23.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.23.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.23.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.23.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.24.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.24.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.24.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.24.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.24.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.24.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.25.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.25.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.25.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.25.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.25.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.25.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.26.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.26.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.26.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.26.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.26.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.26.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.27.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.27.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.27.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.27.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.27.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.27.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.28.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.28.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.28.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.28.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.28.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.28.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.29.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.29.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.29.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.29.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.29.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.29.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.3.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.3.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.3.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.3.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.3.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.3.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.30.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.30.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.30.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.30.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.30.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.30.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.31.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.31.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.31.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.31.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.31.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.31.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.32.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.32.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.32.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.32.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.32.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.32.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.33.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.33.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.33.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.33.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.33.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.33.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.34.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.34.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.34.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.34.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.34.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.34.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.35.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.35.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.35.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.35.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.35.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.35.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.36.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.36.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.36.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.36.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.36.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.36.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.37.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.37.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.37.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.37.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.37.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.37.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.38.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.38.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.38.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.38.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.38.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.38.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.39.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.39.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.39.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.39.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.39.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.39.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.4.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.4.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.4.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.4.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.4.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.4.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.40.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.40.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.40.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.40.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.40.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.40.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.41.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.41.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.41.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.41.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.41.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.41.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.42.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.42.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.42.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.42.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.42.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.42.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.43.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.43.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.43.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.43.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.43.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.43.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.44.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.44.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.44.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.44.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.44.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.44.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.45.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.45.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.45.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.45.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.45.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.45.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.46.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.46.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.46.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.46.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.46.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.46.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.47.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.47.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.47.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.47.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.47.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.47.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.48.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.48.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.48.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.48.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.48.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.48.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.49.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.49.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.49.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.49.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.49.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.49.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.5.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.5.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.5.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.5.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.5.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.5.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.50.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.50.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.50.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.50.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.50.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.50.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.51.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.51.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.51.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.51.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.51.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.51.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.52.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.52.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.52.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.52.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.52.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.52.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.53.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.53.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.53.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.53.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.53.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.53.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.54.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.54.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.54.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.54.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.54.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.54.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.55.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.55.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.55.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.55.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.55.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.55.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.56.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.56.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.56.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.56.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.56.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.56.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.57.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.57.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.57.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.57.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.57.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.57.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.58.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.58.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.58.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.58.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.58.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.58.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.59.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.59.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.59.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.59.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.59.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.59.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.6.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.6.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.6.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.6.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.6.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.6.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.60.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.60.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.60.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.60.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.60.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.60.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.61.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.61.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.61.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.61.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.61.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.61.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.62.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.62.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.62.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.62.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.62.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.62.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.63.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.63.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.63.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.63.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.63.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.63.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.64.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.64.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.64.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.64.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.64.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.64.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.65.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.65.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.65.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.65.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.65.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.65.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.66.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.66.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.66.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.66.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.66.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.66.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.67.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.67.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.67.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.67.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.67.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.67.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.68.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.68.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.68.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.68.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.68.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.68.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.69.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.69.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.69.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.69.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.69.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.69.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.7.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.7.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.7.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.7.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.7.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.7.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.70.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.70.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.70.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.70.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.70.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.70.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.71.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.71.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.71.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.71.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.71.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.71.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.72.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.72.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.72.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.72.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.72.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.72.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.73.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.73.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.73.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.73.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.73.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.73.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.74.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.74.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.74.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.74.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.74.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.74.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.75.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.75.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.75.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.75.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.75.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.75.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.76.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.76.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.76.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.76.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.76.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.76.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.77.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.77.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.77.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.77.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.77.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.77.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.78.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.78.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.78.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.78.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.78.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.78.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.79.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.79.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.79.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.79.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.79.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.79.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.8.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.8.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.8.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.8.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.8.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.8.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.80.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.80.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.80.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.80.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.80.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.80.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.81.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.81.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.81.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.81.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.81.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.81.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.82.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.82.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.82.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.82.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.82.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.82.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.83.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.83.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.83.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.83.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.83.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.83.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.84.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.84.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.84.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.84.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.84.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.84.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.85.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.85.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.85.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.85.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.85.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.85.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.86.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.86.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.86.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.86.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.86.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.86.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.87.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.87.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.87.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.87.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.87.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.87.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.88.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.88.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.88.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.88.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.88.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.88.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.89.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.89.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.89.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.89.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.89.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.89.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.9.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.9.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.9.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.9.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.9.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.9.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.90.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.90.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.90.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.90.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.90.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.90.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.91.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.91.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.91.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.91.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.91.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.91.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.92.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.92.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.92.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.92.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.92.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.92.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.93.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.93.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.93.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.93.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.93.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.93.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.94.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.94.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.94.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.94.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.94.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.94.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.95.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.95.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.95.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.95.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.95.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.95.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.96.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.96.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.96.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.96.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.96.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.96.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.97.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.97.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.97.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.97.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.97.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.97.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.98.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.98.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.98.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.98.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.98.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.98.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.99.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.99.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.99.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.99.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.99.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.experts.99.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.gate.e_score_correction_bias": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.gate.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.shared_experts.down_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.shared_experts.down_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.shared_experts.gate_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.shared_experts.gate_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.shared_experts.up_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.mlp.shared_experts.up_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.post_attention_layernorm.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.self_attn.k_norm.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.self_attn.k_proj.bias": "model-00026-of-00092.safetensors",
+ "model.layers.25.self_attn.k_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.self_attn.k_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.self_attn.o_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.self_attn.o_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.self_attn.q_norm.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.self_attn.q_proj.bias": "model-00026-of-00092.safetensors",
+ "model.layers.25.self_attn.q_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.self_attn.q_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.25.self_attn.v_proj.bias": "model-00026-of-00092.safetensors",
+ "model.layers.25.self_attn.v_proj.weight": "model-00026-of-00092.safetensors",
+ "model.layers.25.self_attn.v_proj.weight_scale": "model-00026-of-00092.safetensors",
+ "model.layers.26.input_layernorm.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.0.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.0.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.0.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.0.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.0.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.0.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.1.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.1.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.1.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.1.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.1.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.1.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.10.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.10.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.10.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.10.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.10.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.10.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.100.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.100.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.100.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.100.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.100.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.100.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.101.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.101.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.101.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.101.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.101.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.101.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.102.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.102.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.102.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.102.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.102.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.102.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.103.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.103.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.103.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.103.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.103.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.103.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.104.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.104.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.104.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.104.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.104.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.104.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.105.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.105.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.105.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.105.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.105.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.105.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.106.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.106.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.106.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.106.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.106.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.106.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.107.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.107.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.107.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.107.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.107.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.107.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.108.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.108.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.108.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.108.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.108.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.108.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.109.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.109.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.109.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.109.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.109.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.109.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.11.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.11.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.11.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.11.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.11.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.11.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.110.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.110.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.110.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.110.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.110.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.110.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.111.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.111.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.111.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.111.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.111.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.111.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.112.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.112.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.112.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.112.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.112.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.112.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.113.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.113.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.113.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.113.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.113.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.113.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.114.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.114.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.114.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.114.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.114.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.114.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.115.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.115.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.115.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.115.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.115.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.115.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.116.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.116.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.116.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.116.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.116.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.116.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.117.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.117.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.117.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.117.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.117.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.117.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.118.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.118.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.118.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.118.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.118.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.118.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.119.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.119.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.119.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.119.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.119.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.119.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.12.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.12.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.12.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.12.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.12.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.12.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.120.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.120.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.120.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.120.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.120.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.120.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.121.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.121.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.121.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.121.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.121.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.121.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.122.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.122.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.122.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.122.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.122.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.122.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.123.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.123.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.123.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.123.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.123.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.123.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.124.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.124.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.124.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.124.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.124.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.124.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.125.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.125.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.125.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.125.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.125.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.125.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.126.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.126.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.126.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.126.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.126.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.126.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.127.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.127.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.127.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.127.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.127.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.127.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.128.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.128.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.128.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.128.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.128.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.128.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.129.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.129.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.129.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.129.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.129.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.129.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.13.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.13.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.13.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.13.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.13.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.13.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.130.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.130.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.130.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.130.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.130.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.130.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.131.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.131.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.131.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.131.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.131.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.131.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.132.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.132.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.132.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.132.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.132.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.132.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.133.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.133.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.133.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.133.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.133.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.133.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.134.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.134.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.134.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.134.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.134.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.134.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.135.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.135.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.135.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.135.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.135.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.135.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.136.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.136.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.136.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.136.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.136.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.136.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.137.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.137.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.137.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.137.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.137.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.137.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.138.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.138.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.138.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.138.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.138.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.138.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.139.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.139.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.139.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.139.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.139.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.139.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.14.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.14.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.14.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.14.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.14.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.14.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.140.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.140.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.140.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.140.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.140.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.140.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.141.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.141.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.141.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.141.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.141.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.141.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.142.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.142.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.142.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.142.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.142.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.142.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.143.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.143.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.143.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.143.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.143.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.143.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.144.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.144.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.144.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.144.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.144.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.144.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.145.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.145.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.145.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.145.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.145.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.145.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.146.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.146.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.146.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.146.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.146.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.146.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.147.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.147.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.147.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.147.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.147.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.147.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.148.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.148.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.148.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.148.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.148.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.148.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.149.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.149.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.149.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.149.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.149.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.149.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.15.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.15.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.15.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.15.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.15.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.15.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.150.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.150.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.150.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.150.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.150.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.150.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.151.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.151.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.151.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.151.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.151.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.151.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.152.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.152.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.152.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.152.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.152.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.152.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.153.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.153.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.153.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.153.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.153.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.153.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.154.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.154.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.154.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.154.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.154.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.154.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.155.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.155.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.155.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.155.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.155.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.155.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.156.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.156.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.156.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.156.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.156.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.156.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.157.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.157.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.157.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.157.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.157.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.157.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.158.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.158.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.158.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.158.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.158.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.158.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.159.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.159.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.159.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.159.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.159.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.159.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.16.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.16.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.16.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.16.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.16.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.16.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.17.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.17.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.17.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.17.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.17.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.17.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.18.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.18.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.18.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.18.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.18.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.18.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.19.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.19.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.19.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.19.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.19.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.19.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.2.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.2.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.2.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.2.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.2.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.2.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.20.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.20.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.20.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.20.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.20.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.20.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.21.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.21.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.21.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.21.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.21.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.21.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.22.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.22.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.22.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.22.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.22.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.22.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.23.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.23.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.23.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.23.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.23.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.23.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.24.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.24.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.24.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.24.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.24.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.24.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.25.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.25.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.25.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.25.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.25.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.25.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.26.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.26.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.26.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.26.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.26.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.26.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.27.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.27.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.27.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.27.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.27.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.27.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.28.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.28.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.28.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.28.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.28.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.28.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.29.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.29.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.29.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.29.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.29.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.29.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.3.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.3.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.3.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.3.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.3.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.3.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.30.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.30.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.30.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.30.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.30.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.30.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.31.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.31.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.31.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.31.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.31.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.31.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.32.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.32.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.32.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.32.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.32.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.32.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.33.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.33.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.33.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.33.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.33.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.33.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.34.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.34.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.34.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.34.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.34.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.34.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.35.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.35.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.35.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.35.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.35.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.35.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.36.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.36.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.36.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.36.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.36.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.36.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.37.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.37.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.37.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.37.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.37.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.37.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.38.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.38.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.38.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.38.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.38.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.38.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.39.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.39.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.39.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.39.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.39.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.39.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.4.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.4.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.4.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.4.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.4.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.4.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.40.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.40.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.40.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.40.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.40.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.40.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.41.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.41.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.41.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.41.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.41.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.41.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.42.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.42.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.42.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.42.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.42.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.42.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.43.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.43.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.43.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.43.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.43.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.43.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.44.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.44.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.44.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.44.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.44.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.44.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.45.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.45.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.45.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.45.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.45.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.45.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.46.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.46.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.46.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.46.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.46.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.46.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.47.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.47.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.47.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.47.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.47.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.47.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.48.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.48.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.48.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.48.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.48.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.48.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.49.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.49.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.49.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.49.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.49.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.49.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.5.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.5.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.5.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.5.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.5.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.5.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.50.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.50.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.50.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.50.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.50.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.50.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.51.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.51.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.51.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.51.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.51.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.51.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.52.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.52.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.52.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.52.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.52.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.52.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.53.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.53.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.53.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.53.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.53.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.53.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.54.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.54.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.54.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.54.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.54.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.54.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.55.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.55.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.55.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.55.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.55.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.55.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.56.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.56.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.56.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.56.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.56.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.56.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.57.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.57.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.57.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.57.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.57.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.57.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.58.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.58.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.58.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.58.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.58.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.58.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.59.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.59.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.59.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.59.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.59.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.59.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.6.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.6.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.6.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.6.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.6.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.6.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.60.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.60.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.60.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.60.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.60.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.60.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.61.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.61.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.61.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.61.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.61.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.61.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.62.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.62.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.62.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.62.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.62.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.62.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.63.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.63.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.63.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.63.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.63.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.63.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.64.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.64.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.64.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.64.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.64.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.64.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.65.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.65.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.65.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.65.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.65.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.65.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.66.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.66.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.66.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.66.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.66.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.66.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.67.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.67.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.67.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.67.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.67.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.67.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.68.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.68.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.68.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.68.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.68.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.68.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.69.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.69.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.69.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.69.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.69.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.69.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.7.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.7.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.7.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.7.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.7.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.7.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.70.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.70.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.70.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.70.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.70.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.70.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.71.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.71.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.71.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.71.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.71.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.71.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.72.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.72.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.72.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.72.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.72.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.72.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.73.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.73.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.73.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.73.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.73.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.73.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.74.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.74.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.74.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.74.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.74.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.74.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.75.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.75.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.75.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.75.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.75.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.75.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.76.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.76.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.76.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.76.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.76.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.76.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.77.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.77.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.77.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.77.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.77.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.77.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.78.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.78.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.78.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.78.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.78.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.78.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.79.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.79.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.79.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.79.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.79.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.79.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.8.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.8.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.8.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.8.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.8.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.8.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.80.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.80.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.80.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.80.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.80.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.80.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.81.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.81.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.81.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.81.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.81.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.81.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.82.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.82.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.82.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.82.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.82.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.82.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.83.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.83.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.83.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.83.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.83.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.83.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.84.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.84.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.84.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.84.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.84.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.84.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.85.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.85.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.85.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.85.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.85.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.85.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.86.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.86.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.86.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.86.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.86.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.86.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.87.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.87.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.87.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.87.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.87.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.87.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.88.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.88.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.88.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.88.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.88.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.88.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.89.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.89.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.89.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.89.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.89.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.89.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.9.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.9.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.9.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.9.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.9.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.9.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.90.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.90.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.90.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.90.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.90.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.90.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.91.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.91.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.91.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.91.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.91.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.91.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.92.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.92.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.92.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.92.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.92.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.92.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.93.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.93.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.93.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.93.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.93.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.93.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.94.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.94.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.94.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.94.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.94.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.94.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.95.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.95.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.95.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.95.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.95.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.95.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.96.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.96.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.96.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.96.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.96.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.96.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.97.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.97.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.97.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.97.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.97.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.97.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.98.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.98.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.98.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.98.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.98.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.98.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.99.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.99.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.99.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.99.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.99.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.experts.99.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.gate.e_score_correction_bias": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.gate.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.shared_experts.down_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.shared_experts.down_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.shared_experts.gate_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.shared_experts.gate_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.shared_experts.up_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.mlp.shared_experts.up_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.post_attention_layernorm.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.self_attn.k_norm.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.self_attn.k_proj.bias": "model-00027-of-00092.safetensors",
+ "model.layers.26.self_attn.k_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.self_attn.k_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.self_attn.o_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.self_attn.o_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.self_attn.q_norm.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.self_attn.q_proj.bias": "model-00027-of-00092.safetensors",
+ "model.layers.26.self_attn.q_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.self_attn.q_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.26.self_attn.v_proj.bias": "model-00027-of-00092.safetensors",
+ "model.layers.26.self_attn.v_proj.weight": "model-00027-of-00092.safetensors",
+ "model.layers.26.self_attn.v_proj.weight_scale": "model-00027-of-00092.safetensors",
+ "model.layers.27.input_layernorm.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.0.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.0.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.0.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.0.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.0.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.0.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.1.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.1.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.1.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.1.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.1.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.1.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.10.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.10.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.10.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.10.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.10.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.10.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.100.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.100.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.100.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.100.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.100.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.100.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.101.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.101.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.101.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.101.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.101.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.101.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.102.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.102.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.102.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.102.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.102.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.102.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.103.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.103.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.103.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.103.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.103.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.103.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.104.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.104.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.104.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.104.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.104.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.104.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.105.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.105.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.105.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.105.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.105.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.105.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.106.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.106.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.106.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.106.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.106.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.106.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.107.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.107.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.107.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.107.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.107.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.107.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.108.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.108.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.108.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.108.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.108.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.108.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.109.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.109.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.109.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.109.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.109.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.109.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.11.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.11.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.11.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.11.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.11.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.11.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.110.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.110.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.110.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.110.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.110.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.110.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.111.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.111.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.111.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.111.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.111.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.111.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.112.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.112.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.112.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.112.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.112.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.112.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.113.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.113.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.113.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.113.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.113.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.113.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.114.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.114.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.114.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.114.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.114.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.114.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.115.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.115.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.115.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.115.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.115.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.115.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.116.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.116.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.116.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.116.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.116.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.116.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.117.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.117.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.117.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.117.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.117.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.117.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.118.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.118.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.118.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.118.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.118.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.118.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.119.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.119.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.119.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.119.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.119.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.119.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.12.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.12.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.12.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.12.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.12.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.12.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.120.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.120.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.120.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.120.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.120.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.120.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.121.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.121.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.121.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.121.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.121.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.121.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.122.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.122.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.122.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.122.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.122.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.122.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.123.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.123.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.123.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.123.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.123.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.123.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.124.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.124.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.124.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.124.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.124.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.124.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.125.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.125.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.125.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.125.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.125.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.125.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.126.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.126.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.126.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.126.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.126.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.126.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.127.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.127.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.127.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.127.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.127.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.127.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.128.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.128.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.128.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.128.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.128.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.128.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.129.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.129.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.129.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.129.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.129.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.129.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.13.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.13.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.13.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.13.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.13.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.13.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.130.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.130.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.130.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.130.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.130.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.130.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.131.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.131.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.131.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.131.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.131.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.131.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.132.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.132.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.132.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.132.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.132.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.132.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.133.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.133.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.133.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.133.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.133.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.133.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.134.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.134.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.134.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.134.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.134.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.134.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.135.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.135.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.135.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.135.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.135.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.135.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.136.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.136.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.136.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.136.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.136.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.136.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.137.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.137.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.137.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.137.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.137.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.137.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.138.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.138.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.138.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.138.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.138.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.138.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.139.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.139.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.139.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.139.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.139.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.139.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.14.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.14.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.14.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.14.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.14.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.14.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.140.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.140.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.140.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.140.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.140.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.140.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.141.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.141.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.141.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.141.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.141.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.141.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.142.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.142.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.142.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.142.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.142.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.142.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.143.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.143.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.143.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.143.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.143.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.143.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.144.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.144.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.144.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.144.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.144.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.144.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.145.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.145.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.145.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.145.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.145.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.145.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.146.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.146.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.146.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.146.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.146.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.146.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.147.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.147.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.147.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.147.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.147.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.147.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.148.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.148.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.148.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.148.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.148.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.148.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.149.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.149.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.149.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.149.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.149.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.149.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.15.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.15.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.15.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.15.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.15.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.15.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.150.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.150.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.150.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.150.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.150.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.150.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.151.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.151.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.151.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.151.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.151.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.151.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.152.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.152.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.152.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.152.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.152.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.152.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.153.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.153.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.153.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.153.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.153.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.153.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.154.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.154.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.154.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.154.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.154.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.154.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.155.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.155.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.155.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.155.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.155.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.155.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.156.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.156.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.156.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.156.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.156.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.156.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.157.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.157.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.157.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.157.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.157.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.157.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.158.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.158.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.158.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.158.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.158.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.158.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.159.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.159.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.159.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.159.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.159.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.159.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.16.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.16.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.16.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.16.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.16.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.16.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.17.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.17.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.17.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.17.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.17.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.17.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.18.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.18.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.18.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.18.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.18.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.18.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.19.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.19.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.19.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.19.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.19.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.19.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.2.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.2.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.2.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.2.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.2.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.2.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.20.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.20.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.20.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.20.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.20.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.20.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.21.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.21.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.21.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.21.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.21.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.21.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.22.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.22.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.22.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.22.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.22.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.22.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.23.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.23.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.23.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.23.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.23.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.23.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.24.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.24.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.24.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.24.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.24.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.24.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.25.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.25.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.25.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.25.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.25.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.25.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.26.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.26.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.26.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.26.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.26.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.26.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.27.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.27.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.27.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.27.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.27.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.27.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.28.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.28.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.28.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.28.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.28.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.28.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.29.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.29.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.29.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.29.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.29.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.29.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.3.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.3.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.3.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.3.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.3.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.3.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.30.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.30.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.30.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.30.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.30.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.30.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.31.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.31.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.31.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.31.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.31.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.31.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.32.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.32.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.32.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.32.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.32.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.32.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.33.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.33.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.33.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.33.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.33.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.33.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.34.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.34.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.34.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.34.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.34.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.34.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.35.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.35.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.35.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.35.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.35.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.35.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.36.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.36.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.36.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.36.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.36.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.36.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.37.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.37.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.37.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.37.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.37.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.37.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.38.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.38.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.38.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.38.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.38.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.38.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.39.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.39.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.39.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.39.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.39.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.39.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.4.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.4.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.4.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.4.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.4.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.4.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.40.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.40.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.40.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.40.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.40.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.40.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.41.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.41.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.41.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.41.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.41.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.41.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.42.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.42.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.42.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.42.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.42.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.42.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.43.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.43.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.43.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.43.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.43.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.43.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.44.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.44.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.44.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.44.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.44.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.44.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.45.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.45.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.45.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.45.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.45.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.45.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.46.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.46.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.46.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.46.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.46.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.46.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.47.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.47.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.47.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.47.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.47.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.47.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.48.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.48.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.48.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.48.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.48.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.48.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.49.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.49.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.49.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.49.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.49.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.49.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.5.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.5.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.5.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.5.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.5.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.5.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.50.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.50.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.50.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.50.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.50.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.50.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.51.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.51.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.51.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.51.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.51.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.51.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.52.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.52.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.52.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.52.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.52.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.52.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.53.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.53.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.53.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.53.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.53.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.53.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.54.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.54.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.54.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.54.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.54.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.54.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.55.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.55.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.55.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.55.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.55.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.55.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.56.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.56.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.56.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.56.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.56.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.56.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.57.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.57.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.57.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.57.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.57.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.57.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.58.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.58.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.58.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.58.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.58.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.58.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.59.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.59.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.59.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.59.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.59.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.59.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.6.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.6.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.6.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.6.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.6.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.6.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.60.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.60.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.60.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.60.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.60.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.60.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.61.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.61.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.61.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.61.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.61.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.61.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.62.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.62.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.62.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.62.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.62.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.62.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.63.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.63.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.63.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.63.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.63.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.63.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.64.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.64.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.64.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.64.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.64.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.64.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.65.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.65.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.65.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.65.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.65.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.65.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.66.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.66.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.66.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.66.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.66.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.66.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.67.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.67.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.67.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.67.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.67.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.67.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.68.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.68.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.68.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.68.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.68.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.68.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.69.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.69.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.69.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.69.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.69.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.69.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.7.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.7.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.7.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.7.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.7.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.7.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.70.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.70.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.70.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.70.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.70.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.70.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.71.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.71.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.71.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.71.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.71.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.71.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.72.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.72.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.72.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.72.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.72.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.72.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.73.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.73.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.73.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.73.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.73.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.73.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.74.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.74.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.74.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.74.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.74.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.74.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.75.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.75.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.75.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.75.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.75.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.75.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.76.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.76.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.76.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.76.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.76.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.76.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.77.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.77.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.77.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.77.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.77.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.77.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.78.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.78.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.78.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.78.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.78.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.78.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.79.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.79.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.79.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.79.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.79.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.79.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.8.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.8.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.8.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.8.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.8.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.8.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.80.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.80.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.80.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.80.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.80.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.80.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.81.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.81.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.81.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.81.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.81.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.81.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.82.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.82.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.82.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.82.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.82.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.82.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.83.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.83.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.83.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.83.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.83.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.83.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.84.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.84.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.84.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.84.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.84.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.84.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.85.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.85.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.85.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.85.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.85.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.85.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.86.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.86.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.86.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.86.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.86.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.86.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.87.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.87.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.87.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.87.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.87.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.87.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.88.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.88.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.88.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.88.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.88.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.88.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.89.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.89.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.89.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.89.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.89.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.89.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.9.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.9.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.9.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.9.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.9.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.9.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.90.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.90.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.90.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.90.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.90.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.90.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.91.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.91.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.91.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.91.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.91.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.91.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.92.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.92.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.92.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.92.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.92.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.92.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.93.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.93.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.93.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.93.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.93.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.93.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.94.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.94.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.94.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.94.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.94.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.94.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.95.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.95.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.95.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.95.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.95.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.95.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.96.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.96.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.96.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.96.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.96.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.96.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.97.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.97.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.97.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.97.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.97.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.97.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.98.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.98.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.98.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.98.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.98.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.98.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.99.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.99.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.99.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.99.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.99.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.experts.99.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.gate.e_score_correction_bias": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.gate.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.shared_experts.down_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.shared_experts.down_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.shared_experts.gate_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.shared_experts.gate_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.shared_experts.up_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.mlp.shared_experts.up_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.post_attention_layernorm.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.self_attn.k_norm.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.self_attn.k_proj.bias": "model-00028-of-00092.safetensors",
+ "model.layers.27.self_attn.k_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.self_attn.k_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.self_attn.o_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.self_attn.o_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.self_attn.q_norm.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.self_attn.q_proj.bias": "model-00028-of-00092.safetensors",
+ "model.layers.27.self_attn.q_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.self_attn.q_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.27.self_attn.v_proj.bias": "model-00028-of-00092.safetensors",
+ "model.layers.27.self_attn.v_proj.weight": "model-00028-of-00092.safetensors",
+ "model.layers.27.self_attn.v_proj.weight_scale": "model-00028-of-00092.safetensors",
+ "model.layers.28.input_layernorm.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.0.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.0.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.0.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.0.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.0.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.0.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.1.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.1.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.1.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.1.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.1.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.1.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.10.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.10.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.10.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.10.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.10.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.10.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.100.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.100.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.100.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.100.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.100.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.100.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.101.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.101.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.101.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.101.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.101.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.101.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.102.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.102.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.102.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.102.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.102.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.102.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.103.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.103.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.103.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.103.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.103.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.103.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.104.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.104.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.104.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.104.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.104.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.104.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.105.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.105.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.105.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.105.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.105.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.105.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.106.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.106.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.106.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.106.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.106.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.106.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.107.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.107.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.107.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.107.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.107.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.107.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.108.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.108.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.108.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.108.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.108.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.108.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.109.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.109.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.109.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.109.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.109.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.109.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.11.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.11.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.11.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.11.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.11.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.11.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.110.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.110.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.110.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.110.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.110.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.110.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.111.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.111.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.111.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.111.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.111.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.111.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.112.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.112.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.112.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.112.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.112.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.112.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.113.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.113.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.113.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.113.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.113.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.113.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.114.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.114.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.114.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.114.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.114.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.114.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.115.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.115.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.115.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.115.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.115.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.115.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.116.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.116.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.116.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.116.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.116.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.116.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.117.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.117.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.117.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.117.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.117.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.117.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.118.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.118.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.118.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.118.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.118.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.118.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.119.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.119.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.119.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.119.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.119.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.119.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.12.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.12.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.12.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.12.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.12.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.12.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.120.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.120.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.120.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.120.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.120.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.120.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.121.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.121.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.121.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.121.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.121.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.121.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.122.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.122.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.122.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.122.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.122.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.122.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.123.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.123.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.123.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.123.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.123.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.123.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.124.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.124.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.124.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.124.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.124.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.124.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.125.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.125.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.125.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.125.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.125.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.125.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.126.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.126.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.126.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.126.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.126.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.126.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.127.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.127.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.127.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.127.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.127.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.127.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.128.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.128.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.128.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.128.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.128.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.128.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.129.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.129.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.129.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.129.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.129.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.129.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.13.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.13.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.13.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.13.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.13.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.13.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.130.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.130.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.130.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.130.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.130.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.130.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.131.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.131.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.131.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.131.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.131.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.131.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.132.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.132.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.132.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.132.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.132.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.132.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.133.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.133.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.133.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.133.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.133.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.133.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.134.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.134.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.134.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.134.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.134.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.134.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.135.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.135.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.135.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.135.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.135.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.135.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.136.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.136.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.136.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.136.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.136.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.136.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.137.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.137.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.137.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.137.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.137.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.137.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.138.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.138.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.138.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.138.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.138.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.138.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.139.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.139.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.139.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.139.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.139.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.139.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.14.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.14.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.14.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.14.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.14.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.14.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.140.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.140.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.140.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.140.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.140.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.140.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.141.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.141.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.141.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.141.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.141.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.141.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.142.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.142.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.142.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.142.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.142.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.142.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.143.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.143.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.143.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.143.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.143.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.143.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.144.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.144.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.144.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.144.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.144.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.144.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.145.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.145.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.145.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.145.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.145.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.145.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.146.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.146.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.146.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.146.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.146.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.146.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.147.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.147.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.147.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.147.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.147.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.147.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.148.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.148.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.148.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.148.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.148.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.148.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.149.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.149.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.149.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.149.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.149.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.149.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.15.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.15.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.15.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.15.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.15.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.15.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.150.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.150.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.150.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.150.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.150.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.150.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.151.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.151.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.151.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.151.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.151.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.151.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.152.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.152.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.152.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.152.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.152.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.152.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.153.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.153.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.153.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.153.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.153.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.153.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.154.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.154.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.154.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.154.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.154.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.154.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.155.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.155.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.155.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.155.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.155.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.155.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.156.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.156.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.156.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.156.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.156.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.156.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.157.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.157.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.157.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.157.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.157.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.157.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.158.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.158.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.158.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.158.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.158.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.158.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.159.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.159.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.159.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.159.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.159.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.159.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.16.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.16.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.16.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.16.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.16.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.16.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.17.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.17.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.17.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.17.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.17.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.17.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.18.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.18.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.18.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.18.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.18.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.18.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.19.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.19.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.19.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.19.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.19.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.19.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.2.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.2.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.2.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.2.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.2.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.2.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.20.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.20.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.20.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.20.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.20.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.20.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.21.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.21.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.21.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.21.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.21.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.21.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.22.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.22.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.22.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.22.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.22.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.22.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.23.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.23.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.23.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.23.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.23.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.23.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.24.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.24.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.24.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.24.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.24.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.24.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.25.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.25.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.25.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.25.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.25.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.25.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.26.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.26.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.26.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.26.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.26.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.26.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.27.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.27.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.27.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.27.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.27.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.27.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.28.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.28.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.28.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.28.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.28.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.28.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.29.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.29.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.29.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.29.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.29.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.29.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.3.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.3.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.3.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.3.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.3.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.3.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.30.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.30.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.30.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.30.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.30.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.30.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.31.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.31.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.31.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.31.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.31.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.31.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.32.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.32.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.32.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.32.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.32.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.32.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.33.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.33.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.33.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.33.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.33.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.33.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.34.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.34.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.34.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.34.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.34.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.34.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.35.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.35.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.35.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.35.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.35.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.35.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.36.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.36.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.36.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.36.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.36.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.36.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.37.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.37.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.37.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.37.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.37.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.37.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.38.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.38.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.38.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.38.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.38.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.38.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.39.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.39.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.39.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.39.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.39.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.39.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.4.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.4.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.4.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.4.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.4.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.4.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.40.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.40.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.40.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.40.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.40.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.40.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.41.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.41.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.41.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.41.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.41.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.41.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.42.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.42.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.42.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.42.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.42.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.42.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.43.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.43.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.43.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.43.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.43.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.43.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.44.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.44.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.44.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.44.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.44.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.44.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.45.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.45.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.45.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.45.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.45.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.45.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.46.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.46.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.46.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.46.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.46.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.46.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.47.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.47.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.47.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.47.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.47.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.47.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.48.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.48.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.48.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.48.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.48.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.48.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.49.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.49.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.49.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.49.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.49.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.49.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.5.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.5.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.5.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.5.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.5.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.5.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.50.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.50.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.50.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.50.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.50.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.50.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.51.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.51.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.51.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.51.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.51.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.51.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.52.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.52.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.52.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.52.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.52.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.52.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.53.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.53.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.53.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.53.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.53.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.53.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.54.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.54.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.54.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.54.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.54.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.54.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.55.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.55.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.55.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.55.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.55.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.55.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.56.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.56.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.56.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.56.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.56.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.56.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.57.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.57.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.57.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.57.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.57.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.57.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.58.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.58.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.58.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.58.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.58.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.58.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.59.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.59.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.59.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.59.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.59.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.59.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.6.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.6.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.6.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.6.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.6.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.6.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.60.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.60.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.60.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.60.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.60.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.60.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.61.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.61.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.61.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.61.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.61.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.61.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.62.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.62.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.62.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.62.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.62.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.62.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.63.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.63.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.63.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.63.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.63.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.63.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.64.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.64.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.64.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.64.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.64.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.64.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.65.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.65.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.65.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.65.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.65.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.65.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.66.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.66.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.66.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.66.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.66.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.66.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.67.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.67.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.67.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.67.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.67.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.67.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.68.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.68.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.68.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.68.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.68.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.68.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.69.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.69.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.69.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.69.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.69.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.69.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.7.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.7.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.7.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.7.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.7.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.7.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.70.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.70.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.70.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.70.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.70.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.70.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.71.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.71.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.71.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.71.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.71.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.71.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.72.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.72.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.72.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.72.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.72.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.72.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.73.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.73.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.73.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.73.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.73.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.73.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.74.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.74.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.74.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.74.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.74.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.74.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.75.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.75.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.75.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.75.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.75.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.75.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.76.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.76.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.76.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.76.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.76.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.76.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.77.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.77.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.77.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.77.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.77.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.77.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.78.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.78.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.78.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.78.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.78.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.78.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.79.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.79.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.79.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.79.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.79.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.79.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.8.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.8.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.8.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.8.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.8.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.8.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.80.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.80.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.80.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.80.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.80.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.80.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.81.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.81.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.81.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.81.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.81.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.81.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.82.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.82.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.82.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.82.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.82.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.82.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.83.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.83.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.83.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.83.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.83.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.83.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.84.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.84.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.84.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.84.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.84.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.84.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.85.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.85.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.85.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.85.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.85.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.85.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.86.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.86.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.86.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.86.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.86.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.86.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.87.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.87.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.87.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.87.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.87.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.87.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.88.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.88.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.88.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.88.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.88.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.88.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.89.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.89.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.89.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.89.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.89.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.89.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.9.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.9.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.9.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.9.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.9.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.9.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.90.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.90.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.90.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.90.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.90.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.90.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.91.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.91.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.91.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.91.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.91.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.91.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.92.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.92.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.92.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.92.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.92.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.92.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.93.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.93.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.93.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.93.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.93.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.93.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.94.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.94.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.94.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.94.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.94.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.94.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.95.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.95.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.95.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.95.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.95.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.95.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.96.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.96.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.96.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.96.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.96.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.96.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.97.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.97.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.97.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.97.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.97.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.97.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.98.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.98.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.98.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.98.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.98.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.98.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.99.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.99.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.99.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.99.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.99.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.experts.99.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.gate.e_score_correction_bias": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.gate.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.shared_experts.down_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.shared_experts.down_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.shared_experts.gate_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.shared_experts.gate_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.shared_experts.up_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.mlp.shared_experts.up_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.post_attention_layernorm.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.self_attn.k_norm.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.self_attn.k_proj.bias": "model-00029-of-00092.safetensors",
+ "model.layers.28.self_attn.k_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.self_attn.k_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.self_attn.o_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.self_attn.o_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.self_attn.q_norm.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.self_attn.q_proj.bias": "model-00029-of-00092.safetensors",
+ "model.layers.28.self_attn.q_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.self_attn.q_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.28.self_attn.v_proj.bias": "model-00029-of-00092.safetensors",
+ "model.layers.28.self_attn.v_proj.weight": "model-00029-of-00092.safetensors",
+ "model.layers.28.self_attn.v_proj.weight_scale": "model-00029-of-00092.safetensors",
+ "model.layers.29.input_layernorm.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.0.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.0.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.0.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.0.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.0.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.0.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.1.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.1.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.1.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.1.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.1.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.1.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.10.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.10.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.10.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.10.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.10.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.10.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.100.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.100.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.100.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.100.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.100.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.100.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.101.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.101.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.101.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.101.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.101.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.101.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.102.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.102.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.102.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.102.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.102.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.102.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.103.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.103.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.103.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.103.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.103.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.103.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.104.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.104.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.104.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.104.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.104.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.104.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.105.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.105.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.105.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.105.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.105.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.105.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.106.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.106.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.106.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.106.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.106.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.106.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.107.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.107.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.107.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.107.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.107.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.107.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.108.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.108.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.108.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.108.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.108.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.108.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.109.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.109.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.109.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.109.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.109.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.109.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.11.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.11.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.11.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.11.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.11.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.11.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.110.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.110.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.110.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.110.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.110.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.110.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.111.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.111.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.111.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.111.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.111.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.111.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.112.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.112.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.112.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.112.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.112.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.112.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.113.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.113.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.113.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.113.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.113.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.113.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.114.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.114.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.114.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.114.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.114.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.114.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.115.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.115.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.115.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.115.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.115.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.115.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.116.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.116.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.116.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.116.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.116.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.116.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.117.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.117.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.117.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.117.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.117.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.117.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.118.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.118.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.118.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.118.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.118.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.118.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.119.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.119.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.119.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.119.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.119.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.119.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.12.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.12.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.12.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.12.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.12.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.12.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.120.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.120.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.120.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.120.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.120.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.120.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.121.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.121.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.121.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.121.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.121.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.121.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.122.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.122.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.122.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.122.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.122.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.122.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.123.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.123.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.123.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.123.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.123.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.123.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.124.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.124.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.124.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.124.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.124.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.124.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.125.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.125.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.125.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.125.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.125.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.125.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.126.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.126.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.126.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.126.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.126.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.126.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.127.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.127.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.127.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.127.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.127.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.127.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.128.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.128.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.128.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.128.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.128.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.128.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.129.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.129.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.129.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.129.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.129.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.129.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.13.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.13.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.13.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.13.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.13.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.13.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.130.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.130.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.130.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.130.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.130.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.130.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.131.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.131.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.131.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.131.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.131.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.131.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.132.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.132.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.132.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.132.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.132.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.132.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.133.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.133.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.133.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.133.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.133.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.133.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.134.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.134.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.134.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.134.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.134.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.134.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.135.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.135.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.135.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.135.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.135.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.135.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.136.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.136.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.136.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.136.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.136.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.136.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.137.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.137.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.137.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.137.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.137.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.137.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.138.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.138.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.138.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.138.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.138.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.138.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.139.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.139.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.139.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.139.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.139.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.139.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.14.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.14.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.14.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.14.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.14.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.14.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.140.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.140.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.140.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.140.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.140.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.140.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.141.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.141.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.141.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.141.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.141.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.141.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.142.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.142.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.142.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.142.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.142.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.142.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.143.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.143.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.143.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.143.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.143.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.143.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.144.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.144.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.144.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.144.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.144.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.144.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.145.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.145.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.145.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.145.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.145.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.145.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.146.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.146.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.146.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.146.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.146.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.146.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.147.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.147.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.147.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.147.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.147.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.147.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.148.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.148.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.148.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.148.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.148.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.148.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.149.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.149.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.149.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.149.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.149.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.149.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.15.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.15.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.15.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.15.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.15.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.15.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.150.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.150.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.150.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.150.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.150.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.150.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.151.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.151.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.151.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.151.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.151.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.151.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.152.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.152.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.152.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.152.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.152.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.152.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.153.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.153.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.153.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.153.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.153.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.153.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.154.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.154.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.154.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.154.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.154.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.154.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.155.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.155.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.155.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.155.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.155.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.155.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.156.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.156.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.156.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.156.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.156.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.156.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.157.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.157.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.157.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.157.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.157.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.157.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.158.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.158.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.158.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.158.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.158.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.158.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.159.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.159.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.159.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.159.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.159.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.159.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.16.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.16.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.16.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.16.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.16.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.16.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.17.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.17.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.17.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.17.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.17.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.17.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.18.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.18.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.18.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.18.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.18.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.18.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.19.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.19.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.19.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.19.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.19.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.19.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.2.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.2.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.2.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.2.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.2.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.2.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.20.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.20.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.20.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.20.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.20.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.20.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.21.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.21.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.21.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.21.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.21.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.21.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.22.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.22.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.22.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.22.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.22.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.22.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.23.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.23.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.23.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.23.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.23.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.23.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.24.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.24.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.24.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.24.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.24.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.24.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.25.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.25.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.25.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.25.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.25.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.25.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.26.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.26.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.26.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.26.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.26.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.26.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.27.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.27.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.27.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.27.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.27.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.27.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.28.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.28.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.28.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.28.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.28.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.28.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.29.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.29.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.29.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.29.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.29.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.29.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.3.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.3.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.3.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.3.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.3.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.3.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.30.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.30.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.30.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.30.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.30.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.30.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.31.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.31.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.31.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.31.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.31.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.31.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.32.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.32.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.32.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.32.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.32.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.32.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.33.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.33.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.33.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.33.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.33.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.33.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.34.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.34.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.34.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.34.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.34.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.34.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.35.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.35.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.35.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.35.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.35.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.35.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.36.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.36.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.36.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.36.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.36.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.36.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.37.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.37.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.37.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.37.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.37.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.37.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.38.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.38.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.38.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.38.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.38.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.38.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.39.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.39.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.39.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.39.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.39.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.39.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.4.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.4.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.4.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.4.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.4.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.4.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.40.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.40.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.40.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.40.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.40.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.40.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.41.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.41.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.41.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.41.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.41.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.41.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.42.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.42.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.42.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.42.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.42.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.42.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.43.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.43.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.43.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.43.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.43.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.43.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.44.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.44.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.44.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.44.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.44.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.44.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.45.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.45.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.45.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.45.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.45.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.45.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.46.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.46.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.46.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.46.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.46.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.46.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.47.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.47.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.47.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.47.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.47.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.47.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.48.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.48.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.48.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.48.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.48.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.48.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.49.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.49.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.49.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.49.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.49.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.49.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.5.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.5.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.5.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.5.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.5.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.5.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.50.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.50.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.50.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.50.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.50.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.50.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.51.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.51.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.51.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.51.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.51.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.51.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.52.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.52.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.52.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.52.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.52.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.52.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.53.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.53.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.53.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.53.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.53.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.53.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.54.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.54.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.54.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.54.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.54.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.54.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.55.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.55.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.55.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.55.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.55.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.55.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.56.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.56.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.56.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.56.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.56.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.56.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.57.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.57.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.57.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.57.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.57.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.57.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.58.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.58.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.58.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.58.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.58.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.58.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.59.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.59.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.59.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.59.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.59.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.59.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.6.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.6.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.6.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.6.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.6.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.6.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.60.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.60.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.60.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.60.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.60.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.60.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.61.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.61.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.61.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.61.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.61.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.61.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.62.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.62.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.62.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.62.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.62.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.62.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.63.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.63.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.63.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.63.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.63.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.63.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.64.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.64.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.64.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.64.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.64.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.64.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.65.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.65.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.65.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.65.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.65.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.65.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.66.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.66.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.66.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.66.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.66.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.66.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.67.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.67.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.67.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.67.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.67.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.67.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.68.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.68.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.68.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.68.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.68.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.68.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.69.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.69.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.69.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.69.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.69.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.69.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.7.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.7.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.7.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.7.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.7.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.7.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.70.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.70.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.70.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.70.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.70.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.70.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.71.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.71.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.71.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.71.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.71.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.71.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.72.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.72.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.72.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.72.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.72.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.72.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.73.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.73.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.73.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.73.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.73.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.73.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.74.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.74.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.74.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.74.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.74.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.74.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.75.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.75.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.75.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.75.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.75.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.75.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.76.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.76.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.76.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.76.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.76.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.76.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.77.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.77.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.77.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.77.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.77.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.77.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.78.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.78.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.78.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.78.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.78.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.78.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.79.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.79.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.79.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.79.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.79.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.79.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.8.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.8.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.8.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.8.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.8.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.8.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.80.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.80.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.80.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.80.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.80.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.80.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.81.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.81.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.81.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.81.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.81.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.81.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.82.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.82.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.82.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.82.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.82.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.82.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.83.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.83.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.83.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.83.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.83.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.83.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.84.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.84.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.84.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.84.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.84.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.84.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.85.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.85.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.85.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.85.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.85.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.85.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.86.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.86.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.86.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.86.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.86.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.86.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.87.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.87.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.87.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.87.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.87.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.87.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.88.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.88.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.88.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.88.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.88.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.88.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.89.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.89.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.89.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.89.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.89.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.89.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.9.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.9.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.9.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.9.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.9.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.9.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.90.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.90.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.90.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.90.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.90.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.90.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.91.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.91.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.91.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.91.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.91.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.91.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.92.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.92.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.92.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.92.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.92.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.92.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.93.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.93.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.93.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.93.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.93.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.93.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.94.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.94.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.94.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.94.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.94.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.94.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.95.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.95.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.95.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.95.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.95.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.95.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.96.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.96.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.96.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.96.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.96.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.96.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.97.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.97.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.97.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.97.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.97.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.97.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.98.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.98.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.98.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.98.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.98.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.98.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.99.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.99.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.99.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.99.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.99.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.experts.99.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.gate.e_score_correction_bias": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.gate.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.shared_experts.down_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.shared_experts.down_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.shared_experts.gate_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.shared_experts.gate_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.shared_experts.up_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.mlp.shared_experts.up_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.post_attention_layernorm.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.self_attn.k_norm.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.self_attn.k_proj.bias": "model-00030-of-00092.safetensors",
+ "model.layers.29.self_attn.k_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.self_attn.k_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.self_attn.o_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.self_attn.o_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.self_attn.q_norm.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.self_attn.q_proj.bias": "model-00030-of-00092.safetensors",
+ "model.layers.29.self_attn.q_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.self_attn.q_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.29.self_attn.v_proj.bias": "model-00030-of-00092.safetensors",
+ "model.layers.29.self_attn.v_proj.weight": "model-00030-of-00092.safetensors",
+ "model.layers.29.self_attn.v_proj.weight_scale": "model-00030-of-00092.safetensors",
+ "model.layers.3.input_layernorm.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.0.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.0.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.0.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.0.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.0.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.0.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.1.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.1.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.1.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.1.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.1.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.1.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.10.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.10.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.10.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.10.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.10.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.10.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.100.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.100.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.100.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.100.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.100.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.100.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.101.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.101.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.101.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.101.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.101.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.101.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.102.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.102.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.102.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.102.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.102.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.102.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.103.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.103.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.103.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.103.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.103.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.103.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.104.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.104.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.104.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.104.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.104.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.104.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.105.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.105.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.105.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.105.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.105.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.105.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.106.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.106.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.106.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.106.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.106.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.106.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.107.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.107.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.107.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.107.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.107.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.107.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.108.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.108.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.108.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.108.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.108.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.108.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.109.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.109.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.109.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.109.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.109.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.109.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.11.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.11.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.11.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.11.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.11.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.11.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.110.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.110.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.110.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.110.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.110.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.110.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.111.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.111.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.111.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.111.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.111.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.111.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.112.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.112.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.112.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.112.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.112.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.112.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.113.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.113.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.113.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.113.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.113.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.113.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.114.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.114.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.114.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.114.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.114.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.114.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.115.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.115.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.115.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.115.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.115.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.115.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.116.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.116.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.116.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.116.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.116.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.116.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.117.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.117.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.117.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.117.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.117.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.117.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.118.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.118.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.118.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.118.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.118.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.118.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.119.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.119.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.119.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.119.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.119.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.119.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.12.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.12.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.12.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.12.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.12.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.12.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.120.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.120.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.120.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.120.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.120.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.120.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.121.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.121.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.121.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.121.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.121.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.121.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.122.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.122.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.122.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.122.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.122.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.122.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.123.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.123.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.123.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.123.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.123.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.123.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.124.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.124.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.124.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.124.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.124.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.124.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.125.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.125.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.125.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.125.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.125.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.125.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.126.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.126.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.126.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.126.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.126.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.126.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.127.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.127.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.127.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.127.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.127.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.127.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.128.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.128.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.128.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.128.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.128.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.128.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.129.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.129.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.129.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.129.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.129.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.129.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.13.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.13.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.13.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.13.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.13.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.13.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.130.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.130.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.130.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.130.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.130.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.130.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.131.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.131.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.131.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.131.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.131.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.131.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.132.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.132.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.132.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.132.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.132.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.132.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.133.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.133.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.133.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.133.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.133.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.133.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.134.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.134.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.134.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.134.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.134.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.134.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.135.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.135.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.135.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.135.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.135.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.135.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.136.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.136.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.136.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.136.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.136.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.136.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.137.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.137.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.137.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.137.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.137.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.137.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.138.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.138.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.138.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.138.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.138.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.138.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.139.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.139.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.139.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.139.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.139.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.139.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.14.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.14.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.14.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.14.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.14.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.14.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.140.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.140.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.140.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.140.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.140.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.140.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.141.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.141.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.141.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.141.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.141.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.141.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.142.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.142.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.142.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.142.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.142.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.142.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.143.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.143.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.143.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.143.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.143.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.143.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.144.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.144.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.144.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.144.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.144.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.144.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.145.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.145.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.145.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.145.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.145.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.145.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.146.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.146.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.146.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.146.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.146.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.146.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.147.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.147.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.147.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.147.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.147.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.147.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.148.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.148.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.148.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.148.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.148.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.148.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.149.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.149.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.149.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.149.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.149.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.149.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.15.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.15.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.15.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.15.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.15.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.15.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.150.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.150.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.150.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.150.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.150.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.150.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.151.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.151.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.151.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.151.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.151.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.151.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.152.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.152.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.152.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.152.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.152.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.152.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.153.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.153.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.153.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.153.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.153.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.153.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.154.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.154.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.154.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.154.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.154.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.154.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.155.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.155.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.155.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.155.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.155.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.155.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.156.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.156.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.156.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.156.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.156.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.156.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.157.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.157.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.157.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.157.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.157.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.157.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.158.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.158.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.158.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.158.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.158.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.158.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.159.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.159.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.159.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.159.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.159.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.159.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.16.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.16.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.16.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.16.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.16.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.16.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.17.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.17.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.17.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.17.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.17.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.17.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.18.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.18.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.18.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.18.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.18.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.18.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.19.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.19.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.19.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.19.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.19.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.19.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.2.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.2.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.2.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.2.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.2.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.2.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.20.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.20.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.20.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.20.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.20.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.20.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.21.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.21.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.21.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.21.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.21.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.21.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.22.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.22.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.22.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.22.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.22.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.22.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.23.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.23.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.23.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.23.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.23.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.23.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.24.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.24.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.24.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.24.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.24.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.24.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.25.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.25.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.25.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.25.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.25.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.25.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.26.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.26.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.26.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.26.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.26.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.26.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.27.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.27.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.27.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.27.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.27.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.27.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.28.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.28.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.28.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.28.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.28.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.28.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.29.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.29.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.29.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.29.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.29.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.29.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.3.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.3.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.3.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.3.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.3.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.3.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.30.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.30.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.30.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.30.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.30.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.30.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.31.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.31.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.31.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.31.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.31.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.31.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.32.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.32.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.32.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.32.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.32.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.32.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.33.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.33.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.33.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.33.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.33.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.33.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.34.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.34.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.34.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.34.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.34.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.34.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.35.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.35.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.35.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.35.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.35.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.35.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.36.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.36.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.36.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.36.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.36.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.36.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.37.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.37.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.37.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.37.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.37.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.37.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.38.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.38.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.38.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.38.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.38.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.38.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.39.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.39.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.39.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.39.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.39.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.39.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.4.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.4.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.4.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.4.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.4.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.4.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.40.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.40.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.40.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.40.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.40.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.40.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.41.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.41.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.41.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.41.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.41.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.41.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.42.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.42.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.42.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.42.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.42.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.42.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.43.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.43.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.43.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.43.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.43.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.43.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.44.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.44.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.44.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.44.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.44.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.44.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.45.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.45.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.45.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.45.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.45.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.45.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.46.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.46.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.46.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.46.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.46.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.46.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.47.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.47.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.47.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.47.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.47.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.47.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.48.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.48.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.48.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.48.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.48.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.48.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.49.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.49.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.49.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.49.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.49.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.49.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.5.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.5.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.5.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.5.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.5.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.5.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.50.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.50.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.50.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.50.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.50.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.50.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.51.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.51.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.51.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.51.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.51.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.51.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.52.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.52.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.52.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.52.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.52.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.52.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.53.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.53.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.53.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.53.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.53.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.53.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.54.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.54.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.54.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.54.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.54.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.54.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.55.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.55.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.55.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.55.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.55.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.55.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.56.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.56.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.56.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.56.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.56.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.56.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.57.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.57.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.57.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.57.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.57.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.57.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.58.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.58.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.58.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.58.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.58.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.58.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.59.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.59.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.59.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.59.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.59.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.59.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.6.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.6.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.6.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.6.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.6.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.6.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.60.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.60.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.60.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.60.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.60.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.60.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.61.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.61.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.61.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.61.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.61.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.61.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.62.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.62.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.62.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.62.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.62.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.62.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.63.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.63.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.63.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.63.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.63.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.63.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.64.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.64.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.64.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.64.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.64.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.64.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.65.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.65.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.65.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.65.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.65.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.65.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.66.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.66.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.66.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.66.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.66.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.66.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.67.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.67.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.67.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.67.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.67.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.67.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.68.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.68.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.68.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.68.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.68.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.68.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.69.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.69.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.69.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.69.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.69.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.69.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.7.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.7.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.7.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.7.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.7.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.7.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.70.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.70.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.70.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.70.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.70.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.70.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.71.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.71.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.71.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.71.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.71.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.71.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.72.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.72.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.72.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.72.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.72.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.72.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.73.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.73.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.73.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.73.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.73.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.73.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.74.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.74.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.74.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.74.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.74.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.74.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.75.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.75.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.75.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.75.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.75.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.75.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.76.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.76.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.76.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.76.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.76.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.76.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.77.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.77.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.77.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.77.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.77.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.77.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.78.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.78.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.78.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.78.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.78.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.78.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.79.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.79.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.79.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.79.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.79.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.79.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.8.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.8.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.8.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.8.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.8.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.8.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.80.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.80.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.80.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.80.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.80.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.80.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.81.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.81.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.81.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.81.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.81.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.81.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.82.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.82.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.82.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.82.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.82.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.82.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.83.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.83.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.83.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.83.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.83.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.83.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.84.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.84.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.84.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.84.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.84.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.84.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.85.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.85.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.85.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.85.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.85.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.85.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.86.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.86.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.86.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.86.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.86.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.86.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.87.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.87.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.87.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.87.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.87.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.87.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.88.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.88.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.88.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.88.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.88.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.88.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.89.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.89.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.89.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.89.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.89.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.89.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.9.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.9.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.9.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.9.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.9.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.9.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.90.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.90.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.90.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.90.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.90.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.90.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.91.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.91.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.91.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.91.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.91.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.91.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.92.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.92.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.92.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.92.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.92.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.92.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.93.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.93.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.93.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.93.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.93.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.93.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.94.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.94.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.94.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.94.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.94.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.94.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.95.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.95.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.95.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.95.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.95.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.95.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.96.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.96.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.96.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.96.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.96.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.96.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.97.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.97.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.97.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.97.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.97.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.97.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.98.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.98.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.98.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.98.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.98.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.98.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.99.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.99.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.99.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.99.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.99.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.experts.99.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.gate.e_score_correction_bias": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.gate.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.shared_experts.down_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.shared_experts.down_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.shared_experts.gate_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.shared_experts.gate_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.shared_experts.up_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.mlp.shared_experts.up_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.post_attention_layernorm.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.self_attn.k_norm.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.self_attn.k_proj.bias": "model-00004-of-00092.safetensors",
+ "model.layers.3.self_attn.k_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.self_attn.k_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.self_attn.o_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.self_attn.o_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.self_attn.q_norm.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.self_attn.q_proj.bias": "model-00004-of-00092.safetensors",
+ "model.layers.3.self_attn.q_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.self_attn.q_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.3.self_attn.v_proj.bias": "model-00004-of-00092.safetensors",
+ "model.layers.3.self_attn.v_proj.weight": "model-00004-of-00092.safetensors",
+ "model.layers.3.self_attn.v_proj.weight_scale": "model-00004-of-00092.safetensors",
+ "model.layers.30.input_layernorm.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.0.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.0.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.0.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.0.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.0.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.0.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.1.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.1.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.1.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.1.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.1.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.1.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.10.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.10.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.10.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.10.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.10.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.10.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.100.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.100.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.100.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.100.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.100.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.100.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.101.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.101.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.101.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.101.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.101.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.101.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.102.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.102.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.102.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.102.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.102.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.102.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.103.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.103.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.103.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.103.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.103.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.103.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.104.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.104.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.104.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.104.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.104.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.104.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.105.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.105.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.105.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.105.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.105.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.105.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.106.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.106.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.106.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.106.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.106.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.106.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.107.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.107.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.107.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.107.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.107.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.107.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.108.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.108.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.108.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.108.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.108.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.108.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.109.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.109.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.109.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.109.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.109.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.109.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.11.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.11.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.11.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.11.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.11.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.11.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.110.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.110.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.110.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.110.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.110.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.110.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.111.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.111.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.111.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.111.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.111.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.111.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.112.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.112.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.112.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.112.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.112.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.112.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.113.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.113.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.113.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.113.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.113.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.113.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.114.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.114.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.114.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.114.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.114.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.114.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.115.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.115.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.115.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.115.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.115.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.115.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.116.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.116.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.116.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.116.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.116.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.116.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.117.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.117.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.117.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.117.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.117.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.117.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.118.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.118.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.118.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.118.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.118.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.118.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.119.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.119.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.119.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.119.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.119.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.119.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.12.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.12.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.12.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.12.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.12.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.12.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.120.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.120.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.120.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.120.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.120.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.120.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.121.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.121.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.121.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.121.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.121.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.121.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.122.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.122.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.122.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.122.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.122.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.122.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.123.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.123.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.123.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.123.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.123.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.123.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.124.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.124.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.124.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.124.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.124.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.124.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.125.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.125.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.125.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.125.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.125.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.125.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.126.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.126.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.126.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.126.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.126.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.126.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.127.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.127.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.127.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.127.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.127.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.127.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.128.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.128.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.128.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.128.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.128.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.128.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.129.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.129.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.129.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.129.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.129.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.129.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.13.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.13.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.13.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.13.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.13.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.13.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.130.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.130.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.130.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.130.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.130.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.130.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.131.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.131.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.131.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.131.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.131.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.131.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.132.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.132.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.132.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.132.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.132.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.132.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.133.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.133.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.133.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.133.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.133.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.133.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.134.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.134.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.134.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.134.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.134.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.134.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.135.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.135.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.135.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.135.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.135.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.135.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.136.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.136.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.136.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.136.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.136.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.136.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.137.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.137.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.137.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.137.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.137.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.137.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.138.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.138.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.138.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.138.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.138.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.138.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.139.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.139.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.139.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.139.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.139.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.139.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.14.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.14.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.14.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.14.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.14.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.14.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.140.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.140.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.140.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.140.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.140.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.140.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.141.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.141.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.141.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.141.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.141.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.141.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.142.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.142.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.142.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.142.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.142.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.142.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.143.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.143.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.143.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.143.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.143.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.143.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.144.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.144.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.144.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.144.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.144.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.144.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.145.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.145.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.145.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.145.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.145.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.145.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.146.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.146.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.146.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.146.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.146.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.146.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.147.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.147.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.147.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.147.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.147.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.147.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.148.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.148.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.148.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.148.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.148.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.148.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.149.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.149.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.149.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.149.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.149.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.149.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.15.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.15.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.15.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.15.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.15.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.15.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.150.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.150.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.150.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.150.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.150.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.150.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.151.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.151.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.151.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.151.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.151.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.151.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.152.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.152.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.152.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.152.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.152.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.152.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.153.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.153.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.153.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.153.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.153.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.153.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.154.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.154.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.154.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.154.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.154.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.154.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.155.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.155.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.155.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.155.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.155.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.155.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.156.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.156.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.156.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.156.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.156.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.156.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.157.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.157.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.157.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.157.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.157.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.157.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.158.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.158.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.158.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.158.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.158.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.158.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.159.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.159.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.159.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.159.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.159.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.159.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.16.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.16.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.16.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.16.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.16.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.16.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.17.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.17.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.17.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.17.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.17.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.17.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.18.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.18.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.18.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.18.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.18.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.18.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.19.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.19.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.19.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.19.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.19.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.19.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.2.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.2.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.2.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.2.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.2.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.2.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.20.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.20.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.20.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.20.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.20.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.20.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.21.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.21.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.21.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.21.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.21.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.21.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.22.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.22.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.22.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.22.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.22.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.22.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.23.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.23.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.23.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.23.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.23.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.23.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.24.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.24.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.24.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.24.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.24.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.24.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.25.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.25.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.25.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.25.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.25.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.25.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.26.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.26.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.26.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.26.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.26.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.26.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.27.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.27.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.27.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.27.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.27.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.27.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.28.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.28.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.28.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.28.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.28.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.28.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.29.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.29.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.29.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.29.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.29.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.29.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.3.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.3.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.3.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.3.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.3.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.3.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.30.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.30.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.30.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.30.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.30.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.30.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.31.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.31.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.31.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.31.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.31.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.31.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.32.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.32.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.32.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.32.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.32.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.32.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.33.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.33.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.33.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.33.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.33.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.33.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.34.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.34.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.34.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.34.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.34.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.34.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.35.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.35.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.35.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.35.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.35.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.35.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.36.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.36.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.36.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.36.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.36.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.36.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.37.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.37.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.37.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.37.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.37.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.37.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.38.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.38.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.38.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.38.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.38.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.38.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.39.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.39.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.39.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.39.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.39.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.39.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.4.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.4.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.4.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.4.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.4.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.4.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.40.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.40.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.40.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.40.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.40.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.40.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.41.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.41.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.41.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.41.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.41.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.41.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.42.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.42.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.42.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.42.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.42.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.42.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.43.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.43.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.43.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.43.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.43.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.43.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.44.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.44.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.44.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.44.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.44.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.44.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.45.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.45.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.45.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.45.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.45.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.45.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.46.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.46.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.46.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.46.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.46.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.46.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.47.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.47.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.47.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.47.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.47.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.47.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.48.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.48.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.48.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.48.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.48.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.48.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.49.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.49.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.49.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.49.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.49.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.49.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.5.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.5.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.5.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.5.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.5.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.5.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.50.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.50.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.50.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.50.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.50.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.50.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.51.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.51.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.51.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.51.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.51.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.51.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.52.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.52.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.52.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.52.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.52.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.52.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.53.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.53.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.53.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.53.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.53.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.53.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.54.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.54.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.54.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.54.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.54.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.54.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.55.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.55.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.55.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.55.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.55.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.55.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.56.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.56.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.56.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.56.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.56.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.56.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.57.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.57.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.57.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.57.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.57.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.57.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.58.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.58.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.58.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.58.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.58.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.58.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.59.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.59.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.59.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.59.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.59.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.59.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.6.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.6.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.6.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.6.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.6.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.6.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.60.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.60.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.60.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.60.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.60.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.60.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.61.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.61.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.61.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.61.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.61.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.61.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.62.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.62.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.62.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.62.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.62.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.62.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.63.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.63.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.63.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.63.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.63.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.63.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.64.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.64.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.64.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.64.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.64.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.64.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.65.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.65.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.65.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.65.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.65.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.65.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.66.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.66.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.66.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.66.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.66.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.66.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.67.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.67.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.67.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.67.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.67.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.67.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.68.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.68.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.68.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.68.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.68.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.68.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.69.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.69.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.69.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.69.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.69.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.69.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.7.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.7.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.7.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.7.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.7.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.7.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.70.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.70.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.70.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.70.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.70.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.70.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.71.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.71.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.71.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.71.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.71.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.71.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.72.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.72.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.72.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.72.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.72.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.72.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.73.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.73.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.73.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.73.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.73.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.73.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.74.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.74.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.74.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.74.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.74.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.74.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.75.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.75.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.75.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.75.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.75.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.75.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.76.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.76.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.76.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.76.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.76.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.76.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.77.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.77.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.77.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.77.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.77.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.77.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.78.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.78.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.78.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.78.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.78.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.78.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.79.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.79.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.79.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.79.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.79.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.79.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.8.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.8.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.8.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.8.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.8.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.8.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.80.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.80.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.80.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.80.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.80.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.80.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.81.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.81.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.81.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.81.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.81.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.81.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.82.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.82.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.82.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.82.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.82.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.82.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.83.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.83.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.83.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.83.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.83.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.83.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.84.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.84.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.84.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.84.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.84.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.84.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.85.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.85.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.85.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.85.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.85.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.85.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.86.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.86.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.86.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.86.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.86.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.86.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.87.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.87.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.87.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.87.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.87.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.87.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.88.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.88.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.88.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.88.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.88.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.88.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.89.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.89.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.89.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.89.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.89.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.89.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.9.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.9.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.9.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.9.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.9.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.9.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.90.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.90.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.90.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.90.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.90.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.90.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.91.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.91.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.91.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.91.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.91.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.91.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.92.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.92.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.92.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.92.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.92.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.92.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.93.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.93.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.93.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.93.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.93.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.93.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.94.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.94.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.94.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.94.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.94.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.94.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.95.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.95.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.95.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.95.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.95.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.95.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.96.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.96.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.96.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.96.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.96.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.96.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.97.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.97.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.97.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.97.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.97.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.97.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.98.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.98.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.98.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.98.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.98.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.98.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.99.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.99.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.99.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.99.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.99.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.experts.99.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.gate.e_score_correction_bias": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.gate.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.shared_experts.down_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.shared_experts.down_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.shared_experts.gate_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.shared_experts.gate_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.shared_experts.up_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.mlp.shared_experts.up_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.post_attention_layernorm.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.self_attn.k_norm.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.self_attn.k_proj.bias": "model-00031-of-00092.safetensors",
+ "model.layers.30.self_attn.k_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.self_attn.k_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.self_attn.o_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.self_attn.o_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.self_attn.q_norm.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.self_attn.q_proj.bias": "model-00031-of-00092.safetensors",
+ "model.layers.30.self_attn.q_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.self_attn.q_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.30.self_attn.v_proj.bias": "model-00031-of-00092.safetensors",
+ "model.layers.30.self_attn.v_proj.weight": "model-00031-of-00092.safetensors",
+ "model.layers.30.self_attn.v_proj.weight_scale": "model-00031-of-00092.safetensors",
+ "model.layers.31.input_layernorm.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.0.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.0.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.0.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.0.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.0.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.0.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.1.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.1.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.1.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.1.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.1.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.1.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.10.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.10.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.10.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.10.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.10.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.10.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.100.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.100.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.100.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.100.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.100.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.100.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.101.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.101.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.101.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.101.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.101.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.101.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.102.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.102.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.102.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.102.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.102.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.102.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.103.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.103.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.103.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.103.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.103.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.103.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.104.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.104.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.104.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.104.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.104.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.104.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.105.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.105.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.105.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.105.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.105.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.105.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.106.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.106.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.106.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.106.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.106.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.106.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.107.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.107.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.107.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.107.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.107.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.107.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.108.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.108.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.108.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.108.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.108.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.108.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.109.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.109.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.109.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.109.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.109.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.109.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.11.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.11.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.11.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.11.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.11.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.11.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.110.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.110.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.110.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.110.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.110.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.110.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.111.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.111.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.111.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.111.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.111.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.111.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.112.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.112.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.112.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.112.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.112.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.112.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.113.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.113.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.113.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.113.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.113.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.113.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.114.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.114.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.114.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.114.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.114.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.114.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.115.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.115.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.115.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.115.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.115.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.115.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.116.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.116.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.116.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.116.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.116.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.116.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.117.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.117.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.117.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.117.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.117.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.117.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.118.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.118.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.118.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.118.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.118.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.118.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.119.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.119.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.119.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.119.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.119.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.119.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.12.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.12.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.12.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.12.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.12.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.12.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.120.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.120.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.120.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.120.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.120.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.120.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.121.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.121.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.121.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.121.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.121.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.121.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.122.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.122.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.122.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.122.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.122.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.122.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.123.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.123.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.123.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.123.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.123.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.123.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.124.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.124.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.124.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.124.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.124.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.124.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.125.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.125.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.125.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.125.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.125.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.125.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.126.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.126.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.126.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.126.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.126.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.126.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.127.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.127.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.127.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.127.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.127.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.127.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.128.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.128.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.128.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.128.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.128.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.128.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.129.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.129.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.129.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.129.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.129.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.129.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.13.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.13.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.13.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.13.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.13.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.13.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.130.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.130.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.130.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.130.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.130.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.130.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.131.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.131.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.131.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.131.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.131.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.131.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.132.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.132.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.132.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.132.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.132.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.132.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.133.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.133.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.133.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.133.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.133.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.133.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.134.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.134.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.134.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.134.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.134.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.134.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.135.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.135.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.135.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.135.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.135.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.135.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.136.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.136.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.136.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.136.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.136.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.136.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.137.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.137.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.137.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.137.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.137.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.137.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.138.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.138.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.138.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.138.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.138.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.138.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.139.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.139.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.139.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.139.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.139.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.139.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.14.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.14.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.14.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.14.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.14.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.14.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.140.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.140.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.140.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.140.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.140.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.140.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.141.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.141.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.141.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.141.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.141.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.141.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.142.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.142.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.142.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.142.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.142.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.142.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.143.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.143.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.143.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.143.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.143.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.143.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.144.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.144.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.144.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.144.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.144.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.144.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.145.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.145.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.145.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.145.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.145.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.145.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.146.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.146.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.146.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.146.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.146.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.146.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.147.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.147.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.147.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.147.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.147.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.147.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.148.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.148.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.148.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.148.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.148.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.148.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.149.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.149.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.149.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.149.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.149.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.149.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.15.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.15.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.15.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.15.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.15.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.15.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.150.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.150.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.150.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.150.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.150.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.150.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.151.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.151.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.151.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.151.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.151.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.151.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.152.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.152.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.152.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.152.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.152.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.152.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.153.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.153.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.153.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.153.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.153.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.153.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.154.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.154.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.154.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.154.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.154.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.154.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.155.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.155.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.155.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.155.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.155.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.155.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.156.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.156.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.156.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.156.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.156.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.156.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.157.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.157.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.157.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.157.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.157.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.157.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.158.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.158.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.158.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.158.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.158.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.158.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.159.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.159.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.159.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.159.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.159.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.159.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.16.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.16.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.16.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.16.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.16.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.16.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.17.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.17.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.17.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.17.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.17.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.17.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.18.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.18.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.18.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.18.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.18.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.18.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.19.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.19.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.19.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.19.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.19.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.19.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.2.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.2.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.2.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.2.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.2.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.2.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.20.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.20.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.20.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.20.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.20.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.20.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.21.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.21.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.21.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.21.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.21.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.21.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.22.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.22.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.22.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.22.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.22.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.22.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.23.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.23.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.23.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.23.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.23.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.23.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.24.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.24.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.24.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.24.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.24.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.24.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.25.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.25.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.25.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.25.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.25.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.25.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.26.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.26.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.26.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.26.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.26.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.26.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.27.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.27.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.27.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.27.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.27.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.27.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.28.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.28.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.28.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.28.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.28.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.28.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.29.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.29.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.29.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.29.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.29.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.29.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.3.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.3.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.3.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.3.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.3.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.3.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.30.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.30.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.30.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.30.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.30.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.30.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.31.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.31.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.31.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.31.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.31.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.31.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.32.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.32.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.32.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.32.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.32.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.32.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.33.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.33.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.33.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.33.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.33.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.33.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.34.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.34.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.34.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.34.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.34.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.34.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.35.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.35.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.35.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.35.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.35.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.35.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.36.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.36.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.36.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.36.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.36.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.36.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.37.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.37.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.37.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.37.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.37.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.37.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.38.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.38.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.38.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.38.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.38.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.38.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.39.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.39.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.39.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.39.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.39.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.39.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.4.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.4.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.4.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.4.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.4.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.4.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.40.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.40.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.40.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.40.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.40.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.40.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.41.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.41.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.41.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.41.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.41.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.41.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.42.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.42.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.42.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.42.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.42.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.42.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.43.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.43.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.43.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.43.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.43.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.43.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.44.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.44.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.44.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.44.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.44.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.44.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.45.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.45.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.45.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.45.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.45.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.45.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.46.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.46.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.46.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.46.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.46.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.46.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.47.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.47.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.47.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.47.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.47.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.47.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.48.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.48.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.48.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.48.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.48.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.48.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.49.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.49.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.49.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.49.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.49.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.49.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.5.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.5.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.5.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.5.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.5.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.5.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.50.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.50.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.50.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.50.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.50.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.50.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.51.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.51.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.51.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.51.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.51.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.51.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.52.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.52.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.52.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.52.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.52.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.52.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.53.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.53.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.53.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.53.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.53.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.53.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.54.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.54.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.54.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.54.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.54.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.54.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.55.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.55.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.55.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.55.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.55.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.55.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.56.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.56.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.56.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.56.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.56.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.56.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.57.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.57.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.57.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.57.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.57.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.57.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.58.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.58.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.58.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.58.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.58.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.58.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.59.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.59.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.59.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.59.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.59.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.59.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.6.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.6.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.6.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.6.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.6.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.6.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.60.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.60.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.60.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.60.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.60.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.60.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.61.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.61.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.61.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.61.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.61.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.61.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.62.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.62.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.62.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.62.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.62.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.62.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.63.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.63.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.63.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.63.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.63.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.63.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.64.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.64.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.64.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.64.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.64.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.64.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.65.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.65.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.65.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.65.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.65.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.65.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.66.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.66.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.66.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.66.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.66.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.66.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.67.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.67.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.67.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.67.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.67.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.67.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.68.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.68.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.68.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.68.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.68.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.68.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.69.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.69.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.69.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.69.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.69.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.69.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.7.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.7.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.7.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.7.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.7.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.7.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.70.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.70.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.70.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.70.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.70.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.70.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.71.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.71.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.71.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.71.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.71.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.71.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.72.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.72.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.72.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.72.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.72.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.72.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.73.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.73.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.73.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.73.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.73.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.73.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.74.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.74.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.74.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.74.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.74.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.74.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.75.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.75.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.75.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.75.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.75.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.75.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.76.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.76.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.76.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.76.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.76.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.76.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.77.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.77.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.77.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.77.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.77.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.77.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.78.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.78.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.78.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.78.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.78.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.78.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.79.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.79.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.79.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.79.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.79.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.79.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.8.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.8.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.8.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.8.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.8.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.8.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.80.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.80.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.80.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.80.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.80.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.80.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.81.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.81.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.81.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.81.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.81.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.81.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.82.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.82.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.82.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.82.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.82.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.82.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.83.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.83.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.83.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.83.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.83.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.83.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.84.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.84.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.84.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.84.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.84.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.84.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.85.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.85.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.85.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.85.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.85.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.85.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.86.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.86.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.86.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.86.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.86.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.86.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.87.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.87.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.87.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.87.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.87.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.87.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.88.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.88.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.88.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.88.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.88.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.88.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.89.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.89.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.89.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.89.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.89.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.89.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.9.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.9.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.9.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.9.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.9.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.9.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.90.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.90.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.90.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.90.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.90.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.90.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.91.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.91.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.91.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.91.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.91.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.91.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.92.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.92.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.92.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.92.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.92.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.92.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.93.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.93.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.93.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.93.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.93.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.93.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.94.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.94.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.94.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.94.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.94.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.94.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.95.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.95.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.95.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.95.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.95.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.95.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.96.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.96.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.96.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.96.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.96.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.96.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.97.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.97.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.97.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.97.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.97.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.97.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.98.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.98.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.98.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.98.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.98.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.98.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.99.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.99.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.99.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.99.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.99.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.experts.99.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.gate.e_score_correction_bias": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.gate.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.shared_experts.down_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.shared_experts.down_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.shared_experts.gate_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.shared_experts.gate_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.shared_experts.up_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.mlp.shared_experts.up_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.post_attention_layernorm.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.self_attn.k_norm.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.self_attn.k_proj.bias": "model-00032-of-00092.safetensors",
+ "model.layers.31.self_attn.k_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.self_attn.k_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.self_attn.o_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.self_attn.o_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.self_attn.q_norm.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.self_attn.q_proj.bias": "model-00032-of-00092.safetensors",
+ "model.layers.31.self_attn.q_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.self_attn.q_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.31.self_attn.v_proj.bias": "model-00032-of-00092.safetensors",
+ "model.layers.31.self_attn.v_proj.weight": "model-00032-of-00092.safetensors",
+ "model.layers.31.self_attn.v_proj.weight_scale": "model-00032-of-00092.safetensors",
+ "model.layers.32.input_layernorm.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.0.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.0.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.0.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.0.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.0.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.0.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.1.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.1.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.1.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.1.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.1.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.1.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.10.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.10.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.10.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.10.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.10.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.10.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.100.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.100.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.100.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.100.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.100.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.100.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.101.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.101.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.101.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.101.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.101.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.101.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.102.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.102.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.102.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.102.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.102.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.102.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.103.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.103.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.103.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.103.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.103.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.103.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.104.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.104.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.104.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.104.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.104.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.104.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.105.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.105.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.105.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.105.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.105.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.105.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.106.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.106.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.106.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.106.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.106.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.106.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.107.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.107.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.107.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.107.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.107.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.107.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.108.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.108.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.108.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.108.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.108.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.108.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.109.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.109.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.109.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.109.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.109.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.109.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.11.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.11.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.11.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.11.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.11.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.11.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.110.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.110.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.110.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.110.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.110.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.110.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.111.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.111.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.111.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.111.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.111.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.111.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.112.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.112.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.112.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.112.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.112.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.112.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.113.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.113.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.113.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.113.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.113.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.113.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.114.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.114.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.114.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.114.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.114.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.114.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.115.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.115.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.115.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.115.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.115.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.115.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.116.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.116.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.116.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.116.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.116.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.116.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.117.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.117.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.117.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.117.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.117.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.117.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.118.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.118.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.118.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.118.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.118.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.118.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.119.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.119.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.119.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.119.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.119.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.119.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.12.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.12.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.12.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.12.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.12.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.12.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.120.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.120.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.120.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.120.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.120.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.120.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.121.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.121.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.121.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.121.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.121.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.121.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.122.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.122.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.122.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.122.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.122.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.122.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.123.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.123.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.123.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.123.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.123.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.123.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.124.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.124.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.124.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.124.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.124.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.124.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.125.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.125.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.125.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.125.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.125.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.125.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.126.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.126.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.126.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.126.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.126.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.126.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.127.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.127.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.127.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.127.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.127.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.127.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.128.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.128.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.128.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.128.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.128.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.128.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.129.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.129.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.129.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.129.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.129.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.129.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.13.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.13.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.13.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.13.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.13.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.13.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.130.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.130.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.130.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.130.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.130.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.130.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.131.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.131.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.131.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.131.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.131.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.131.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.132.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.132.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.132.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.132.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.132.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.132.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.133.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.133.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.133.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.133.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.133.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.133.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.134.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.134.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.134.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.134.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.134.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.134.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.135.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.135.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.135.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.135.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.135.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.135.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.136.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.136.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.136.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.136.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.136.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.136.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.137.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.137.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.137.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.137.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.137.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.137.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.138.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.138.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.138.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.138.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.138.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.138.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.139.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.139.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.139.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.139.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.139.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.139.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.14.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.14.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.14.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.14.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.14.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.14.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.140.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.140.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.140.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.140.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.140.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.140.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.141.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.141.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.141.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.141.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.141.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.141.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.142.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.142.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.142.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.142.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.142.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.142.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.143.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.143.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.143.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.143.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.143.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.143.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.144.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.144.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.144.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.144.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.144.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.144.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.145.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.145.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.145.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.145.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.145.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.145.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.146.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.146.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.146.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.146.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.146.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.146.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.147.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.147.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.147.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.147.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.147.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.147.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.148.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.148.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.148.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.148.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.148.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.148.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.149.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.149.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.149.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.149.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.149.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.149.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.15.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.15.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.15.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.15.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.15.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.15.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.150.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.150.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.150.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.150.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.150.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.150.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.151.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.151.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.151.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.151.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.151.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.151.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.152.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.152.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.152.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.152.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.152.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.152.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.153.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.153.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.153.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.153.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.153.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.153.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.154.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.154.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.154.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.154.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.154.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.154.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.155.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.155.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.155.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.155.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.155.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.155.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.156.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.156.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.156.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.156.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.156.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.156.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.157.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.157.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.157.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.157.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.157.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.157.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.158.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.158.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.158.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.158.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.158.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.158.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.159.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.159.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.159.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.159.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.159.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.159.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.16.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.16.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.16.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.16.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.16.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.16.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.17.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.17.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.17.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.17.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.17.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.17.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.18.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.18.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.18.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.18.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.18.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.18.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.19.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.19.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.19.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.19.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.19.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.19.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.2.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.2.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.2.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.2.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.2.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.2.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.20.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.20.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.20.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.20.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.20.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.20.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.21.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.21.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.21.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.21.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.21.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.21.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.22.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.22.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.22.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.22.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.22.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.22.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.23.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.23.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.23.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.23.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.23.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.23.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.24.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.24.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.24.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.24.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.24.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.24.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.25.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.25.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.25.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.25.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.25.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.25.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.26.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.26.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.26.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.26.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.26.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.26.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.27.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.27.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.27.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.27.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.27.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.27.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.28.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.28.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.28.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.28.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.28.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.28.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.29.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.29.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.29.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.29.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.29.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.29.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.3.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.3.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.3.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.3.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.3.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.3.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.30.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.30.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.30.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.30.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.30.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.30.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.31.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.31.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.31.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.31.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.31.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.31.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.32.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.32.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.32.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.32.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.32.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.32.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.33.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.33.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.33.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.33.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.33.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.33.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.34.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.34.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.34.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.34.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.34.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.34.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.35.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.35.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.35.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.35.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.35.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.35.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.36.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.36.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.36.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.36.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.36.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.36.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.37.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.37.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.37.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.37.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.37.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.37.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.38.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.38.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.38.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.38.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.38.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.38.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.39.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.39.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.39.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.39.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.39.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.39.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.4.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.4.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.4.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.4.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.4.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.4.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.40.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.40.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.40.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.40.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.40.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.40.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.41.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.41.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.41.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.41.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.41.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.41.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.42.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.42.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.42.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.42.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.42.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.42.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.43.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.43.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.43.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.43.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.43.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.43.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.44.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.44.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.44.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.44.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.44.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.44.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.45.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.45.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.45.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.45.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.45.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.45.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.46.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.46.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.46.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.46.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.46.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.46.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.47.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.47.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.47.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.47.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.47.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.47.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.48.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.48.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.48.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.48.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.48.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.48.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.49.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.49.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.49.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.49.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.49.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.49.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.5.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.5.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.5.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.5.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.5.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.5.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.50.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.50.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.50.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.50.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.50.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.50.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.51.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.51.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.51.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.51.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.51.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.51.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.52.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.52.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.52.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.52.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.52.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.52.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.53.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.53.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.53.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.53.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.53.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.53.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.54.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.54.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.54.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.54.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.54.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.54.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.55.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.55.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.55.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.55.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.55.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.55.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.56.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.56.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.56.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.56.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.56.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.56.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.57.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.57.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.57.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.57.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.57.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.57.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.58.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.58.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.58.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.58.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.58.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.58.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.59.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.59.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.59.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.59.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.59.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.59.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.6.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.6.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.6.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.6.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.6.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.6.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.60.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.60.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.60.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.60.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.60.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.60.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.61.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.61.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.61.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.61.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.61.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.61.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.62.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.62.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.62.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.62.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.62.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.62.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.63.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.63.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.63.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.63.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.63.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.63.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.64.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.64.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.64.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.64.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.64.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.64.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.65.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.65.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.65.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.65.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.65.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.65.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.66.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.66.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.66.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.66.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.66.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.66.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.67.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.67.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.67.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.67.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.67.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.67.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.68.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.68.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.68.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.68.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.68.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.68.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.69.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.69.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.69.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.69.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.69.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.69.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.7.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.7.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.7.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.7.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.7.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.7.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.70.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.70.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.70.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.70.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.70.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.70.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.71.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.71.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.71.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.71.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.71.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.71.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.72.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.72.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.72.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.72.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.72.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.72.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.73.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.73.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.73.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.73.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.73.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.73.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.74.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.74.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.74.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.74.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.74.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.74.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.75.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.75.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.75.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.75.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.75.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.75.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.76.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.76.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.76.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.76.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.76.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.76.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.77.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.77.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.77.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.77.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.77.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.77.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.78.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.78.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.78.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.78.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.78.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.78.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.79.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.79.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.79.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.79.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.79.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.79.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.8.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.8.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.8.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.8.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.8.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.8.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.80.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.80.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.80.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.80.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.80.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.80.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.81.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.81.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.81.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.81.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.81.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.81.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.82.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.82.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.82.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.82.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.82.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.82.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.83.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.83.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.83.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.83.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.83.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.83.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.84.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.84.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.84.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.84.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.84.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.84.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.85.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.85.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.85.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.85.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.85.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.85.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.86.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.86.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.86.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.86.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.86.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.86.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.87.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.87.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.87.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.87.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.87.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.87.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.88.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.88.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.88.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.88.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.88.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.88.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.89.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.89.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.89.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.89.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.89.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.89.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.9.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.9.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.9.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.9.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.9.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.9.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.90.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.90.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.90.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.90.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.90.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.90.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.91.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.91.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.91.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.91.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.91.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.91.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.92.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.92.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.92.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.92.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.92.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.92.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.93.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.93.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.93.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.93.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.93.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.93.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.94.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.94.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.94.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.94.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.94.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.94.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.95.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.95.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.95.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.95.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.95.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.95.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.96.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.96.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.96.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.96.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.96.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.96.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.97.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.97.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.97.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.97.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.97.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.97.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.98.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.98.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.98.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.98.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.98.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.98.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.99.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.99.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.99.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.99.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.99.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.experts.99.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.gate.e_score_correction_bias": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.gate.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.shared_experts.down_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.shared_experts.down_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.shared_experts.gate_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.shared_experts.gate_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.shared_experts.up_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.mlp.shared_experts.up_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.post_attention_layernorm.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.self_attn.k_norm.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.self_attn.k_proj.bias": "model-00033-of-00092.safetensors",
+ "model.layers.32.self_attn.k_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.self_attn.k_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.self_attn.o_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.self_attn.o_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.self_attn.q_norm.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.self_attn.q_proj.bias": "model-00033-of-00092.safetensors",
+ "model.layers.32.self_attn.q_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.self_attn.q_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.32.self_attn.v_proj.bias": "model-00033-of-00092.safetensors",
+ "model.layers.32.self_attn.v_proj.weight": "model-00033-of-00092.safetensors",
+ "model.layers.32.self_attn.v_proj.weight_scale": "model-00033-of-00092.safetensors",
+ "model.layers.33.input_layernorm.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.0.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.0.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.0.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.0.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.0.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.0.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.1.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.1.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.1.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.1.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.1.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.1.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.10.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.10.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.10.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.10.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.10.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.10.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.100.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.100.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.100.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.100.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.100.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.100.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.101.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.101.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.101.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.101.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.101.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.101.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.102.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.102.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.102.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.102.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.102.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.102.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.103.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.103.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.103.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.103.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.103.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.103.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.104.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.104.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.104.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.104.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.104.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.104.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.105.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.105.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.105.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.105.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.105.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.105.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.106.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.106.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.106.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.106.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.106.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.106.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.107.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.107.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.107.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.107.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.107.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.107.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.108.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.108.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.108.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.108.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.108.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.108.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.109.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.109.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.109.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.109.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.109.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.109.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.11.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.11.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.11.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.11.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.11.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.11.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.110.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.110.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.110.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.110.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.110.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.110.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.111.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.111.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.111.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.111.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.111.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.111.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.112.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.112.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.112.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.112.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.112.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.112.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.113.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.113.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.113.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.113.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.113.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.113.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.114.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.114.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.114.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.114.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.114.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.114.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.115.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.115.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.115.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.115.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.115.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.115.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.116.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.116.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.116.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.116.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.116.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.116.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.117.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.117.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.117.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.117.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.117.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.117.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.118.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.118.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.118.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.118.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.118.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.118.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.119.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.119.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.119.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.119.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.119.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.119.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.12.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.12.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.12.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.12.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.12.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.12.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.120.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.120.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.120.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.120.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.120.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.120.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.121.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.121.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.121.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.121.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.121.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.121.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.122.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.122.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.122.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.122.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.122.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.122.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.123.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.123.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.123.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.123.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.123.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.123.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.124.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.124.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.124.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.124.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.124.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.124.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.125.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.125.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.125.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.125.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.125.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.125.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.126.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.126.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.126.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.126.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.126.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.126.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.127.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.127.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.127.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.127.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.127.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.127.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.128.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.128.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.128.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.128.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.128.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.128.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.129.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.129.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.129.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.129.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.129.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.129.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.13.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.13.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.13.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.13.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.13.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.13.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.130.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.130.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.130.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.130.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.130.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.130.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.131.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.131.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.131.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.131.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.131.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.131.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.132.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.132.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.132.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.132.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.132.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.132.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.133.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.133.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.133.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.133.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.133.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.133.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.134.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.134.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.134.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.134.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.134.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.134.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.135.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.135.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.135.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.135.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.135.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.135.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.136.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.136.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.136.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.136.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.136.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.136.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.137.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.137.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.137.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.137.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.137.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.137.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.138.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.138.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.138.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.138.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.138.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.138.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.139.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.139.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.139.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.139.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.139.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.139.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.14.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.14.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.14.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.14.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.14.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.14.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.140.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.140.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.140.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.140.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.140.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.140.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.141.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.141.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.141.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.141.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.141.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.141.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.142.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.142.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.142.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.142.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.142.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.142.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.143.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.143.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.143.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.143.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.143.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.143.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.144.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.144.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.144.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.144.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.144.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.144.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.145.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.145.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.145.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.145.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.145.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.145.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.146.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.146.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.146.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.146.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.146.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.146.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.147.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.147.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.147.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.147.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.147.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.147.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.148.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.148.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.148.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.148.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.148.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.148.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.149.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.149.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.149.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.149.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.149.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.149.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.15.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.15.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.15.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.15.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.15.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.15.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.150.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.150.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.150.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.150.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.150.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.150.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.151.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.151.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.151.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.151.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.151.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.151.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.152.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.152.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.152.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.152.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.152.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.152.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.153.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.153.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.153.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.153.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.153.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.153.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.154.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.154.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.154.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.154.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.154.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.154.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.155.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.155.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.155.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.155.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.155.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.155.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.156.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.156.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.156.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.156.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.156.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.156.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.157.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.157.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.157.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.157.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.157.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.157.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.158.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.158.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.158.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.158.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.158.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.158.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.159.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.159.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.159.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.159.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.159.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.159.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.16.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.16.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.16.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.16.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.16.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.16.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.17.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.17.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.17.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.17.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.17.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.17.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.18.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.18.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.18.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.18.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.18.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.18.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.19.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.19.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.19.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.19.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.19.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.19.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.2.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.2.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.2.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.2.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.2.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.2.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.20.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.20.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.20.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.20.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.20.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.20.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.21.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.21.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.21.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.21.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.21.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.21.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.22.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.22.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.22.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.22.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.22.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.22.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.23.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.23.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.23.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.23.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.23.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.23.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.24.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.24.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.24.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.24.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.24.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.24.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.25.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.25.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.25.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.25.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.25.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.25.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.26.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.26.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.26.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.26.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.26.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.26.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.27.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.27.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.27.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.27.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.27.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.27.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.28.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.28.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.28.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.28.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.28.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.28.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.29.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.29.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.29.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.29.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.29.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.29.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.3.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.3.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.3.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.3.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.3.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.3.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.30.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.30.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.30.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.30.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.30.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.30.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.31.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.31.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.31.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.31.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.31.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.31.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.32.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.32.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.32.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.32.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.32.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.32.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.33.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.33.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.33.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.33.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.33.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.33.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.34.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.34.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.34.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.34.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.34.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.34.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.35.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.35.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.35.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.35.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.35.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.35.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.36.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.36.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.36.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.36.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.36.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.36.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.37.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.37.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.37.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.37.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.37.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.37.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.38.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.38.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.38.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.38.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.38.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.38.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.39.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.39.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.39.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.39.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.39.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.39.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.4.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.4.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.4.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.4.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.4.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.4.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.40.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.40.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.40.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.40.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.40.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.40.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.41.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.41.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.41.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.41.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.41.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.41.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.42.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.42.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.42.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.42.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.42.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.42.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.43.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.43.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.43.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.43.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.43.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.43.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.44.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.44.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.44.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.44.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.44.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.44.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.45.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.45.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.45.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.45.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.45.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.45.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.46.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.46.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.46.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.46.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.46.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.46.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.47.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.47.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.47.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.47.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.47.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.47.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.48.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.48.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.48.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.48.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.48.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.48.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.49.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.49.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.49.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.49.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.49.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.49.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.5.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.5.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.5.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.5.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.5.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.5.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.50.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.50.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.50.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.50.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.50.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.50.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.51.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.51.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.51.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.51.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.51.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.51.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.52.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.52.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.52.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.52.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.52.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.52.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.53.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.53.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.53.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.53.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.53.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.53.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.54.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.54.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.54.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.54.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.54.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.54.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.55.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.55.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.55.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.55.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.55.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.55.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.56.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.56.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.56.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.56.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.56.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.56.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.57.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.57.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.57.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.57.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.57.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.57.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.58.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.58.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.58.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.58.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.58.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.58.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.59.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.59.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.59.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.59.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.59.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.59.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.6.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.6.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.6.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.6.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.6.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.6.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.60.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.60.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.60.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.60.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.60.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.60.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.61.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.61.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.61.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.61.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.61.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.61.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.62.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.62.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.62.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.62.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.62.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.62.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.63.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.63.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.63.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.63.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.63.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.63.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.64.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.64.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.64.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.64.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.64.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.64.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.65.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.65.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.65.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.65.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.65.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.65.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.66.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.66.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.66.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.66.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.66.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.66.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.67.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.67.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.67.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.67.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.67.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.67.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.68.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.68.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.68.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.68.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.68.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.68.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.69.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.69.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.69.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.69.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.69.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.69.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.7.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.7.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.7.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.7.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.7.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.7.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.70.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.70.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.70.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.70.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.70.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.70.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.71.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.71.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.71.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.71.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.71.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.71.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.72.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.72.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.72.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.72.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.72.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.72.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.73.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.73.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.73.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.73.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.73.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.73.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.74.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.74.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.74.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.74.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.74.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.74.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.75.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.75.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.75.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.75.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.75.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.75.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.76.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.76.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.76.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.76.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.76.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.76.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.77.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.77.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.77.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.77.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.77.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.77.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.78.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.78.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.78.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.78.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.78.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.78.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.79.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.79.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.79.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.79.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.79.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.79.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.8.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.8.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.8.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.8.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.8.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.8.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.80.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.80.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.80.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.80.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.80.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.80.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.81.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.81.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.81.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.81.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.81.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.81.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.82.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.82.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.82.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.82.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.82.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.82.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.83.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.83.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.83.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.83.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.83.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.83.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.84.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.84.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.84.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.84.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.84.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.84.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.85.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.85.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.85.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.85.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.85.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.85.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.86.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.86.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.86.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.86.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.86.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.86.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.87.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.87.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.87.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.87.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.87.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.87.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.88.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.88.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.88.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.88.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.88.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.88.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.89.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.89.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.89.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.89.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.89.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.89.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.9.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.9.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.9.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.9.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.9.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.9.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.90.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.90.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.90.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.90.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.90.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.90.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.91.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.91.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.91.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.91.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.91.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.91.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.92.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.92.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.92.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.92.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.92.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.92.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.93.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.93.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.93.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.93.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.93.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.93.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.94.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.94.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.94.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.94.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.94.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.94.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.95.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.95.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.95.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.95.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.95.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.95.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.96.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.96.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.96.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.96.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.96.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.96.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.97.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.97.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.97.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.97.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.97.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.97.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.98.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.98.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.98.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.98.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.98.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.98.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.99.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.99.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.99.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.99.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.99.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.experts.99.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.gate.e_score_correction_bias": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.gate.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.shared_experts.down_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.shared_experts.down_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.shared_experts.gate_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.shared_experts.gate_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.shared_experts.up_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.mlp.shared_experts.up_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.post_attention_layernorm.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.self_attn.k_norm.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.self_attn.k_proj.bias": "model-00034-of-00092.safetensors",
+ "model.layers.33.self_attn.k_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.self_attn.k_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.self_attn.o_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.self_attn.o_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.self_attn.q_norm.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.self_attn.q_proj.bias": "model-00034-of-00092.safetensors",
+ "model.layers.33.self_attn.q_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.self_attn.q_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.33.self_attn.v_proj.bias": "model-00034-of-00092.safetensors",
+ "model.layers.33.self_attn.v_proj.weight": "model-00034-of-00092.safetensors",
+ "model.layers.33.self_attn.v_proj.weight_scale": "model-00034-of-00092.safetensors",
+ "model.layers.34.input_layernorm.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.0.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.0.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.0.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.0.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.0.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.0.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.1.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.1.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.1.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.1.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.1.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.1.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.10.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.10.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.10.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.10.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.10.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.10.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.100.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.100.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.100.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.100.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.100.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.100.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.101.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.101.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.101.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.101.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.101.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.101.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.102.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.102.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.102.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.102.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.102.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.102.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.103.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.103.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.103.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.103.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.103.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.103.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.104.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.104.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.104.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.104.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.104.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.104.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.105.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.105.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.105.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.105.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.105.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.105.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.106.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.106.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.106.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.106.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.106.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.106.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.107.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.107.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.107.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.107.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.107.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.107.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.108.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.108.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.108.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.108.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.108.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.108.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.109.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.109.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.109.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.109.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.109.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.109.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.11.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.11.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.11.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.11.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.11.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.11.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.110.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.110.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.110.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.110.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.110.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.110.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.111.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.111.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.111.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.111.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.111.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.111.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.112.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.112.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.112.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.112.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.112.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.112.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.113.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.113.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.113.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.113.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.113.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.113.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.114.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.114.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.114.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.114.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.114.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.114.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.115.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.115.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.115.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.115.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.115.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.115.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.116.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.116.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.116.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.116.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.116.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.116.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.117.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.117.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.117.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.117.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.117.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.117.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.118.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.118.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.118.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.118.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.118.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.118.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.119.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.119.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.119.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.119.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.119.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.119.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.12.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.12.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.12.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.12.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.12.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.12.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.120.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.120.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.120.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.120.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.120.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.120.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.121.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.121.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.121.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.121.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.121.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.121.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.122.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.122.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.122.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.122.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.122.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.122.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.123.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.123.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.123.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.123.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.123.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.123.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.124.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.124.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.124.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.124.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.124.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.124.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.125.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.125.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.125.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.125.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.125.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.125.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.126.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.126.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.126.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.126.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.126.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.126.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.127.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.127.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.127.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.127.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.127.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.127.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.128.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.128.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.128.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.128.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.128.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.128.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.129.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.129.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.129.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.129.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.129.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.129.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.13.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.13.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.13.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.13.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.13.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.13.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.130.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.130.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.130.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.130.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.130.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.130.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.131.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.131.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.131.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.131.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.131.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.131.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.132.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.132.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.132.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.132.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.132.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.132.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.133.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.133.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.133.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.133.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.133.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.133.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.134.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.134.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.134.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.134.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.134.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.134.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.135.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.135.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.135.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.135.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.135.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.135.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.136.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.136.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.136.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.136.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.136.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.136.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.137.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.137.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.137.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.137.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.137.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.137.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.138.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.138.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.138.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.138.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.138.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.138.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.139.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.139.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.139.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.139.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.139.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.139.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.14.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.14.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.14.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.14.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.14.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.14.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.140.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.140.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.140.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.140.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.140.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.140.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.141.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.141.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.141.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.141.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.141.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.141.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.142.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.142.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.142.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.142.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.142.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.142.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.143.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.143.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.143.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.143.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.143.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.143.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.144.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.144.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.144.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.144.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.144.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.144.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.145.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.145.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.145.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.145.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.145.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.145.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.146.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.146.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.146.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.146.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.146.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.146.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.147.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.147.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.147.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.147.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.147.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.147.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.148.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.148.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.148.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.148.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.148.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.148.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.149.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.149.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.149.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.149.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.149.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.149.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.15.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.15.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.15.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.15.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.15.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.15.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.150.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.150.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.150.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.150.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.150.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.150.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.151.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.151.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.151.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.151.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.151.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.151.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.152.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.152.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.152.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.152.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.152.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.152.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.153.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.153.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.153.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.153.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.153.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.153.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.154.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.154.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.154.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.154.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.154.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.154.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.155.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.155.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.155.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.155.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.155.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.155.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.156.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.156.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.156.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.156.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.156.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.156.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.157.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.157.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.157.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.157.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.157.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.157.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.158.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.158.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.158.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.158.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.158.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.158.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.159.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.159.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.159.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.159.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.159.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.159.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.16.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.16.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.16.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.16.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.16.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.16.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.17.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.17.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.17.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.17.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.17.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.17.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.18.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.18.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.18.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.18.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.18.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.18.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.19.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.19.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.19.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.19.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.19.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.19.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.2.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.2.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.2.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.2.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.2.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.2.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.20.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.20.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.20.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.20.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.20.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.20.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.21.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.21.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.21.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.21.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.21.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.21.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.22.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.22.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.22.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.22.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.22.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.22.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.23.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.23.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.23.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.23.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.23.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.23.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.24.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.24.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.24.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.24.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.24.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.24.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.25.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.25.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.25.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.25.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.25.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.25.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.26.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.26.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.26.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.26.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.26.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.26.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.27.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.27.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.27.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.27.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.27.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.27.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.28.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.28.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.28.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.28.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.28.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.28.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.29.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.29.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.29.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.29.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.29.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.29.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.3.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.3.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.3.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.3.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.3.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.3.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.30.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.30.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.30.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.30.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.30.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.30.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.31.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.31.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.31.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.31.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.31.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.31.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.32.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.32.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.32.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.32.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.32.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.32.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.33.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.33.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.33.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.33.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.33.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.33.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.34.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.34.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.34.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.34.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.34.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.34.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.35.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.35.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.35.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.35.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.35.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.35.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.36.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.36.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.36.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.36.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.36.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.36.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.37.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.37.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.37.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.37.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.37.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.37.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.38.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.38.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.38.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.38.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.38.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.38.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.39.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.39.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.39.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.39.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.39.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.39.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.4.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.4.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.4.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.4.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.4.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.4.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.40.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.40.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.40.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.40.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.40.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.40.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.41.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.41.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.41.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.41.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.41.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.41.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.42.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.42.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.42.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.42.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.42.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.42.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.43.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.43.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.43.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.43.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.43.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.43.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.44.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.44.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.44.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.44.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.44.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.44.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.45.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.45.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.45.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.45.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.45.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.45.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.46.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.46.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.46.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.46.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.46.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.46.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.47.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.47.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.47.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.47.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.47.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.47.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.48.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.48.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.48.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.48.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.48.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.48.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.49.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.49.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.49.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.49.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.49.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.49.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.5.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.5.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.5.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.5.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.5.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.5.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.50.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.50.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.50.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.50.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.50.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.50.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.51.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.51.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.51.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.51.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.51.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.51.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.52.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.52.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.52.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.52.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.52.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.52.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.53.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.53.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.53.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.53.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.53.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.53.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.54.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.54.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.54.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.54.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.54.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.54.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.55.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.55.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.55.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.55.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.55.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.55.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.56.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.56.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.56.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.56.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.56.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.56.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.57.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.57.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.57.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.57.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.57.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.57.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.58.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.58.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.58.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.58.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.58.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.58.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.59.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.59.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.59.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.59.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.59.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.59.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.6.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.6.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.6.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.6.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.6.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.6.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.60.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.60.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.60.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.60.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.60.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.60.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.61.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.61.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.61.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.61.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.61.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.61.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.62.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.62.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.62.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.62.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.62.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.62.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.63.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.63.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.63.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.63.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.63.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.63.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.64.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.64.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.64.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.64.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.64.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.64.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.65.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.65.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.65.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.65.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.65.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.65.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.66.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.66.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.66.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.66.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.66.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.66.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.67.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.67.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.67.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.67.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.67.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.67.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.68.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.68.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.68.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.68.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.68.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.68.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.69.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.69.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.69.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.69.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.69.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.69.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.7.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.7.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.7.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.7.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.7.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.7.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.70.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.70.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.70.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.70.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.70.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.70.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.71.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.71.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.71.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.71.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.71.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.71.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.72.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.72.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.72.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.72.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.72.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.72.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.73.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.73.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.73.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.73.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.73.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.73.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.74.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.74.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.74.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.74.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.74.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.74.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.75.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.75.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.75.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.75.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.75.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.75.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.76.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.76.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.76.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.76.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.76.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.76.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.77.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.77.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.77.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.77.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.77.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.77.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.78.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.78.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.78.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.78.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.78.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.78.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.79.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.79.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.79.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.79.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.79.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.79.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.8.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.8.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.8.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.8.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.8.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.8.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.80.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.80.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.80.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.80.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.80.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.80.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.81.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.81.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.81.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.81.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.81.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.81.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.82.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.82.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.82.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.82.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.82.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.82.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.83.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.83.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.83.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.83.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.83.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.83.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.84.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.84.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.84.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.84.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.84.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.84.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.85.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.85.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.85.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.85.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.85.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.85.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.86.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.86.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.86.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.86.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.86.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.86.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.87.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.87.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.87.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.87.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.87.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.87.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.88.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.88.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.88.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.88.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.88.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.88.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.89.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.89.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.89.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.89.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.89.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.89.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.9.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.9.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.9.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.9.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.9.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.9.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.90.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.90.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.90.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.90.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.90.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.90.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.91.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.91.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.91.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.91.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.91.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.91.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.92.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.92.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.92.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.92.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.92.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.92.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.93.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.93.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.93.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.93.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.93.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.93.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.94.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.94.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.94.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.94.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.94.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.94.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.95.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.95.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.95.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.95.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.95.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.95.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.96.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.96.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.96.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.96.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.96.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.96.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.97.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.97.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.97.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.97.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.97.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.97.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.98.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.98.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.98.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.98.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.98.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.98.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.99.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.99.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.99.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.99.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.99.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.experts.99.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.gate.e_score_correction_bias": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.gate.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.shared_experts.down_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.shared_experts.down_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.shared_experts.gate_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.shared_experts.gate_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.shared_experts.up_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.mlp.shared_experts.up_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.post_attention_layernorm.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.self_attn.k_norm.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.self_attn.k_proj.bias": "model-00035-of-00092.safetensors",
+ "model.layers.34.self_attn.k_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.self_attn.k_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.self_attn.o_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.self_attn.o_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.self_attn.q_norm.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.self_attn.q_proj.bias": "model-00035-of-00092.safetensors",
+ "model.layers.34.self_attn.q_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.self_attn.q_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.34.self_attn.v_proj.bias": "model-00035-of-00092.safetensors",
+ "model.layers.34.self_attn.v_proj.weight": "model-00035-of-00092.safetensors",
+ "model.layers.34.self_attn.v_proj.weight_scale": "model-00035-of-00092.safetensors",
+ "model.layers.35.input_layernorm.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.0.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.0.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.0.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.0.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.0.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.0.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.1.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.1.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.1.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.1.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.1.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.1.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.10.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.10.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.10.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.10.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.10.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.10.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.100.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.100.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.100.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.100.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.100.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.100.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.101.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.101.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.101.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.101.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.101.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.101.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.102.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.102.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.102.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.102.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.102.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.102.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.103.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.103.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.103.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.103.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.103.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.103.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.104.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.104.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.104.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.104.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.104.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.104.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.105.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.105.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.105.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.105.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.105.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.105.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.106.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.106.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.106.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.106.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.106.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.106.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.107.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.107.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.107.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.107.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.107.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.107.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.108.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.108.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.108.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.108.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.108.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.108.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.109.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.109.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.109.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.109.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.109.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.109.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.11.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.11.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.11.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.11.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.11.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.11.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.110.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.110.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.110.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.110.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.110.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.110.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.111.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.111.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.111.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.111.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.111.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.111.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.112.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.112.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.112.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.112.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.112.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.112.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.113.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.113.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.113.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.113.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.113.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.113.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.114.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.114.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.114.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.114.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.114.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.114.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.115.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.115.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.115.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.115.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.115.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.115.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.116.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.116.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.116.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.116.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.116.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.116.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.117.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.117.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.117.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.117.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.117.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.117.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.118.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.118.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.118.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.118.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.118.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.118.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.119.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.119.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.119.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.119.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.119.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.119.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.12.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.12.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.12.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.12.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.12.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.12.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.120.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.120.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.120.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.120.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.120.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.120.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.121.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.121.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.121.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.121.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.121.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.121.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.122.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.122.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.122.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.122.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.122.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.122.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.123.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.123.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.123.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.123.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.123.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.123.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.124.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.124.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.124.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.124.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.124.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.124.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.125.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.125.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.125.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.125.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.125.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.125.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.126.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.126.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.126.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.126.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.126.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.126.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.127.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.127.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.127.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.127.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.127.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.127.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.128.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.128.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.128.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.128.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.128.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.128.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.129.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.129.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.129.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.129.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.129.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.129.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.13.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.13.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.13.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.13.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.13.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.13.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.130.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.130.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.130.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.130.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.130.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.130.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.131.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.131.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.131.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.131.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.131.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.131.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.132.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.132.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.132.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.132.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.132.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.132.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.133.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.133.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.133.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.133.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.133.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.133.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.134.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.134.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.134.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.134.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.134.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.134.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.135.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.135.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.135.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.135.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.135.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.135.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.136.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.136.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.136.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.136.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.136.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.136.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.137.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.137.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.137.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.137.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.137.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.137.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.138.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.138.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.138.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.138.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.138.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.138.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.139.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.139.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.139.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.139.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.139.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.139.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.14.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.14.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.14.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.14.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.14.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.14.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.140.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.140.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.140.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.140.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.140.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.140.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.141.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.141.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.141.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.141.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.141.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.141.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.142.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.142.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.142.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.142.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.142.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.142.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.143.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.143.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.143.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.143.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.143.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.143.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.144.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.144.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.144.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.144.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.144.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.144.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.145.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.145.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.145.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.145.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.145.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.145.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.146.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.146.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.146.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.146.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.146.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.146.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.147.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.147.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.147.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.147.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.147.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.147.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.148.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.148.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.148.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.148.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.148.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.148.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.149.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.149.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.149.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.149.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.149.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.149.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.15.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.15.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.15.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.15.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.15.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.15.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.150.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.150.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.150.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.150.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.150.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.150.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.151.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.151.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.151.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.151.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.151.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.151.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.152.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.152.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.152.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.152.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.152.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.152.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.153.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.153.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.153.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.153.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.153.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.153.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.154.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.154.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.154.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.154.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.154.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.154.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.155.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.155.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.155.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.155.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.155.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.155.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.156.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.156.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.156.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.156.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.156.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.156.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.157.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.157.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.157.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.157.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.157.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.157.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.158.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.158.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.158.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.158.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.158.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.158.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.159.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.159.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.159.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.159.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.159.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.159.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.16.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.16.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.16.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.16.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.16.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.16.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.17.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.17.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.17.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.17.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.17.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.17.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.18.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.18.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.18.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.18.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.18.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.18.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.19.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.19.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.19.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.19.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.19.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.19.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.2.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.2.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.2.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.2.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.2.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.2.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.20.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.20.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.20.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.20.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.20.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.20.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.21.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.21.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.21.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.21.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.21.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.21.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.22.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.22.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.22.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.22.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.22.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.22.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.23.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.23.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.23.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.23.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.23.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.23.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.24.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.24.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.24.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.24.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.24.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.24.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.25.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.25.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.25.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.25.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.25.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.25.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.26.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.26.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.26.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.26.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.26.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.26.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.27.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.27.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.27.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.27.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.27.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.27.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.28.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.28.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.28.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.28.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.28.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.28.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.29.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.29.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.29.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.29.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.29.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.29.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.3.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.3.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.3.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.3.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.3.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.3.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.30.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.30.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.30.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.30.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.30.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.30.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.31.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.31.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.31.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.31.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.31.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.31.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.32.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.32.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.32.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.32.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.32.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.32.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.33.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.33.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.33.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.33.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.33.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.33.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.34.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.34.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.34.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.34.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.34.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.34.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.35.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.35.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.35.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.35.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.35.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.35.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.36.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.36.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.36.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.36.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.36.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.36.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.37.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.37.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.37.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.37.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.37.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.37.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.38.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.38.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.38.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.38.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.38.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.38.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.39.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.39.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.39.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.39.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.39.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.39.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.4.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.4.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.4.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.4.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.4.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.4.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.40.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.40.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.40.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.40.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.40.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.40.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.41.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.41.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.41.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.41.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.41.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.41.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.42.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.42.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.42.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.42.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.42.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.42.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.43.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.43.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.43.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.43.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.43.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.43.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.44.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.44.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.44.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.44.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.44.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.44.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.45.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.45.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.45.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.45.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.45.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.45.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.46.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.46.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.46.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.46.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.46.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.46.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.47.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.47.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.47.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.47.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.47.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.47.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.48.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.48.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.48.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.48.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.48.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.48.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.49.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.49.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.49.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.49.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.49.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.49.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.5.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.5.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.5.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.5.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.5.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.5.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.50.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.50.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.50.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.50.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.50.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.50.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.51.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.51.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.51.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.51.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.51.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.51.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.52.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.52.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.52.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.52.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.52.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.52.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.53.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.53.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.53.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.53.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.53.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.53.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.54.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.54.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.54.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.54.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.54.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.54.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.55.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.55.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.55.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.55.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.55.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.55.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.56.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.56.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.56.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.56.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.56.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.56.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.57.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.57.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.57.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.57.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.57.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.57.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.58.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.58.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.58.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.58.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.58.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.58.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.59.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.59.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.59.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.59.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.59.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.59.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.6.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.6.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.6.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.6.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.6.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.6.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.60.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.60.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.60.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.60.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.60.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.60.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.61.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.61.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.61.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.61.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.61.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.61.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.62.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.62.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.62.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.62.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.62.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.62.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.63.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.63.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.63.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.63.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.63.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.63.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.64.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.64.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.64.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.64.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.64.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.64.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.65.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.65.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.65.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.65.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.65.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.65.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.66.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.66.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.66.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.66.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.66.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.66.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.67.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.67.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.67.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.67.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.67.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.67.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.68.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.68.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.68.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.68.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.68.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.68.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.69.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.69.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.69.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.69.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.69.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.69.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.7.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.7.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.7.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.7.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.7.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.7.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.70.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.70.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.70.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.70.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.70.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.70.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.71.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.71.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.71.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.71.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.71.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.71.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.72.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.72.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.72.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.72.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.72.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.72.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.73.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.73.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.73.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.73.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.73.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.73.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.74.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.74.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.74.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.74.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.74.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.74.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.75.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.75.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.75.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.75.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.75.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.75.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.76.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.76.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.76.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.76.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.76.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.76.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.77.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.77.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.77.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.77.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.77.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.77.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.78.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.78.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.78.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.78.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.78.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.78.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.79.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.79.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.79.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.79.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.79.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.79.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.8.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.8.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.8.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.8.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.8.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.8.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.80.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.80.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.80.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.80.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.80.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.80.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.81.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.81.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.81.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.81.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.81.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.81.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.82.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.82.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.82.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.82.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.82.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.82.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.83.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.83.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.83.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.83.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.83.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.83.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.84.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.84.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.84.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.84.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.84.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.84.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.85.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.85.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.85.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.85.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.85.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.85.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.86.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.86.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.86.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.86.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.86.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.86.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.87.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.87.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.87.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.87.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.87.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.87.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.88.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.88.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.88.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.88.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.88.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.88.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.89.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.89.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.89.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.89.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.89.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.89.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.9.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.9.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.9.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.9.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.9.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.9.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.90.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.90.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.90.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.90.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.90.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.90.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.91.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.91.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.91.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.91.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.91.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.91.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.92.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.92.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.92.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.92.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.92.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.92.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.93.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.93.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.93.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.93.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.93.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.93.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.94.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.94.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.94.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.94.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.94.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.94.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.95.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.95.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.95.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.95.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.95.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.95.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.96.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.96.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.96.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.96.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.96.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.96.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.97.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.97.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.97.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.97.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.97.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.97.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.98.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.98.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.98.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.98.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.98.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.98.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.99.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.99.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.99.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.99.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.99.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.experts.99.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.gate.e_score_correction_bias": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.gate.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.shared_experts.down_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.shared_experts.down_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.shared_experts.gate_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.shared_experts.gate_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.shared_experts.up_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.mlp.shared_experts.up_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.post_attention_layernorm.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.self_attn.k_norm.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.self_attn.k_proj.bias": "model-00036-of-00092.safetensors",
+ "model.layers.35.self_attn.k_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.self_attn.k_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.self_attn.o_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.self_attn.o_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.self_attn.q_norm.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.self_attn.q_proj.bias": "model-00036-of-00092.safetensors",
+ "model.layers.35.self_attn.q_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.self_attn.q_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.35.self_attn.v_proj.bias": "model-00036-of-00092.safetensors",
+ "model.layers.35.self_attn.v_proj.weight": "model-00036-of-00092.safetensors",
+ "model.layers.35.self_attn.v_proj.weight_scale": "model-00036-of-00092.safetensors",
+ "model.layers.36.input_layernorm.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.0.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.0.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.0.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.0.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.0.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.0.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.1.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.1.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.1.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.1.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.1.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.1.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.10.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.10.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.10.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.10.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.10.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.10.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.100.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.100.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.100.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.100.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.100.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.100.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.101.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.101.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.101.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.101.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.101.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.101.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.102.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.102.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.102.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.102.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.102.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.102.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.103.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.103.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.103.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.103.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.103.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.103.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.104.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.104.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.104.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.104.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.104.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.104.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.105.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.105.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.105.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.105.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.105.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.105.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.106.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.106.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.106.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.106.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.106.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.106.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.107.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.107.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.107.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.107.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.107.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.107.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.108.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.108.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.108.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.108.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.108.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.108.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.109.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.109.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.109.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.109.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.109.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.109.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.11.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.11.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.11.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.11.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.11.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.11.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.110.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.110.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.110.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.110.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.110.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.110.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.111.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.111.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.111.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.111.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.111.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.111.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.112.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.112.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.112.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.112.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.112.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.112.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.113.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.113.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.113.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.113.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.113.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.113.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.114.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.114.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.114.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.114.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.114.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.114.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.115.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.115.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.115.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.115.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.115.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.115.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.116.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.116.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.116.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.116.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.116.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.116.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.117.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.117.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.117.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.117.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.117.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.117.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.118.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.118.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.118.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.118.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.118.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.118.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.119.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.119.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.119.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.119.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.119.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.119.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.12.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.12.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.12.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.12.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.12.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.12.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.120.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.120.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.120.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.120.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.120.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.120.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.121.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.121.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.121.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.121.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.121.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.121.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.122.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.122.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.122.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.122.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.122.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.122.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.123.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.123.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.123.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.123.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.123.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.123.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.124.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.124.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.124.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.124.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.124.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.124.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.125.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.125.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.125.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.125.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.125.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.125.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.126.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.126.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.126.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.126.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.126.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.126.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.127.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.127.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.127.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.127.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.127.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.127.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.128.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.128.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.128.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.128.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.128.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.128.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.129.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.129.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.129.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.129.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.129.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.129.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.13.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.13.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.13.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.13.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.13.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.13.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.130.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.130.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.130.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.130.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.130.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.130.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.131.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.131.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.131.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.131.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.131.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.131.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.132.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.132.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.132.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.132.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.132.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.132.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.133.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.133.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.133.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.133.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.133.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.133.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.134.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.134.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.134.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.134.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.134.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.134.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.135.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.135.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.135.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.135.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.135.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.135.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.136.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.136.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.136.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.136.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.136.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.136.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.137.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.137.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.137.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.137.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.137.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.137.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.138.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.138.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.138.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.138.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.138.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.138.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.139.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.139.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.139.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.139.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.139.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.139.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.14.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.14.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.14.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.14.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.14.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.14.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.140.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.140.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.140.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.140.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.140.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.140.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.141.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.141.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.141.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.141.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.141.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.141.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.142.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.142.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.142.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.142.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.142.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.142.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.143.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.143.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.143.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.143.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.143.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.143.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.144.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.144.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.144.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.144.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.144.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.144.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.145.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.145.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.145.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.145.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.145.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.145.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.146.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.146.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.146.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.146.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.146.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.146.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.147.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.147.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.147.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.147.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.147.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.147.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.148.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.148.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.148.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.148.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.148.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.148.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.149.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.149.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.149.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.149.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.149.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.149.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.15.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.15.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.15.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.15.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.15.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.15.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.150.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.150.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.150.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.150.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.150.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.150.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.151.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.151.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.151.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.151.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.151.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.151.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.152.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.152.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.152.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.152.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.152.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.152.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.153.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.153.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.153.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.153.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.153.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.153.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.154.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.154.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.154.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.154.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.154.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.154.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.155.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.155.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.155.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.155.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.155.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.155.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.156.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.156.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.156.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.156.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.156.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.156.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.157.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.157.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.157.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.157.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.157.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.157.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.158.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.158.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.158.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.158.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.158.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.158.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.159.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.159.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.159.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.159.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.159.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.159.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.16.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.16.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.16.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.16.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.16.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.16.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.17.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.17.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.17.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.17.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.17.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.17.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.18.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.18.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.18.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.18.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.18.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.18.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.19.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.19.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.19.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.19.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.19.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.19.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.2.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.2.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.2.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.2.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.2.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.2.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.20.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.20.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.20.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.20.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.20.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.20.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.21.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.21.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.21.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.21.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.21.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.21.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.22.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.22.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.22.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.22.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.22.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.22.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.23.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.23.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.23.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.23.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.23.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.23.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.24.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.24.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.24.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.24.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.24.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.24.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.25.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.25.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.25.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.25.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.25.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.25.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.26.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.26.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.26.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.26.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.26.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.26.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.27.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.27.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.27.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.27.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.27.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.27.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.28.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.28.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.28.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.28.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.28.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.28.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.29.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.29.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.29.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.29.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.29.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.29.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.3.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.3.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.3.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.3.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.3.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.3.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.30.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.30.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.30.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.30.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.30.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.30.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.31.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.31.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.31.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.31.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.31.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.31.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.32.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.32.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.32.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.32.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.32.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.32.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.33.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.33.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.33.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.33.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.33.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.33.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.34.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.34.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.34.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.34.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.34.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.34.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.35.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.35.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.35.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.35.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.35.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.35.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.36.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.36.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.36.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.36.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.36.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.36.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.37.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.37.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.37.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.37.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.37.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.37.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.38.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.38.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.38.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.38.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.38.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.38.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.39.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.39.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.39.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.39.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.39.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.39.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.4.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.4.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.4.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.4.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.4.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.4.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.40.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.40.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.40.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.40.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.40.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.40.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.41.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.41.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.41.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.41.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.41.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.41.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.42.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.42.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.42.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.42.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.42.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.42.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.43.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.43.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.43.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.43.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.43.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.43.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.44.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.44.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.44.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.44.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.44.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.44.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.45.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.45.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.45.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.45.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.45.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.45.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.46.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.46.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.46.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.46.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.46.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.46.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.47.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.47.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.47.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.47.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.47.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.47.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.48.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.48.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.48.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.48.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.48.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.48.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.49.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.49.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.49.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.49.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.49.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.49.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.5.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.5.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.5.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.5.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.5.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.5.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.50.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.50.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.50.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.50.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.50.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.50.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.51.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.51.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.51.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.51.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.51.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.51.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.52.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.52.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.52.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.52.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.52.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.52.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.53.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.53.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.53.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.53.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.53.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.53.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.54.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.54.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.54.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.54.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.54.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.54.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.55.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.55.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.55.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.55.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.55.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.55.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.56.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.56.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.56.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.56.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.56.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.56.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.57.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.57.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.57.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.57.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.57.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.57.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.58.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.58.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.58.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.58.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.58.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.58.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.59.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.59.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.59.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.59.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.59.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.59.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.6.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.6.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.6.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.6.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.6.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.6.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.60.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.60.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.60.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.60.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.60.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.60.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.61.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.61.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.61.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.61.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.61.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.61.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.62.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.62.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.62.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.62.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.62.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.62.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.63.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.63.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.63.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.63.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.63.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.63.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.64.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.64.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.64.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.64.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.64.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.64.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.65.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.65.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.65.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.65.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.65.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.65.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.66.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.66.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.66.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.66.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.66.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.66.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.67.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.67.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.67.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.67.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.67.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.67.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.68.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.68.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.68.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.68.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.68.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.68.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.69.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.69.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.69.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.69.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.69.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.69.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.7.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.7.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.7.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.7.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.7.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.7.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.70.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.70.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.70.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.70.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.70.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.70.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.71.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.71.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.71.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.71.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.71.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.71.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.72.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.72.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.72.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.72.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.72.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.72.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.73.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.73.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.73.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.73.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.73.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.73.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.74.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.74.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.74.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.74.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.74.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.74.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.75.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.75.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.75.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.75.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.75.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.75.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.76.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.76.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.76.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.76.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.76.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.76.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.77.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.77.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.77.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.77.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.77.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.77.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.78.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.78.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.78.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.78.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.78.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.78.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.79.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.79.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.79.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.79.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.79.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.79.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.8.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.8.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.8.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.8.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.8.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.8.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.80.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.80.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.80.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.80.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.80.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.80.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.81.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.81.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.81.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.81.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.81.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.81.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.82.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.82.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.82.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.82.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.82.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.82.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.83.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.83.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.83.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.83.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.83.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.83.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.84.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.84.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.84.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.84.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.84.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.84.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.85.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.85.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.85.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.85.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.85.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.85.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.86.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.86.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.86.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.86.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.86.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.86.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.87.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.87.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.87.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.87.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.87.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.87.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.88.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.88.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.88.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.88.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.88.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.88.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.89.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.89.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.89.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.89.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.89.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.89.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.9.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.9.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.9.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.9.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.9.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.9.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.90.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.90.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.90.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.90.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.90.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.90.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.91.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.91.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.91.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.91.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.91.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.91.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.92.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.92.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.92.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.92.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.92.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.92.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.93.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.93.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.93.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.93.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.93.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.93.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.94.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.94.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.94.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.94.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.94.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.94.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.95.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.95.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.95.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.95.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.95.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.95.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.96.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.96.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.96.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.96.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.96.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.96.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.97.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.97.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.97.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.97.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.97.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.97.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.98.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.98.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.98.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.98.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.98.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.98.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.99.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.99.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.99.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.99.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.99.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.experts.99.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.gate.e_score_correction_bias": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.gate.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.shared_experts.down_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.shared_experts.down_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.shared_experts.gate_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.shared_experts.gate_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.shared_experts.up_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.mlp.shared_experts.up_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.post_attention_layernorm.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.self_attn.k_norm.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.self_attn.k_proj.bias": "model-00037-of-00092.safetensors",
+ "model.layers.36.self_attn.k_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.self_attn.k_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.self_attn.o_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.self_attn.o_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.self_attn.q_norm.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.self_attn.q_proj.bias": "model-00037-of-00092.safetensors",
+ "model.layers.36.self_attn.q_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.self_attn.q_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.36.self_attn.v_proj.bias": "model-00037-of-00092.safetensors",
+ "model.layers.36.self_attn.v_proj.weight": "model-00037-of-00092.safetensors",
+ "model.layers.36.self_attn.v_proj.weight_scale": "model-00037-of-00092.safetensors",
+ "model.layers.37.input_layernorm.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.0.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.0.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.0.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.0.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.0.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.0.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.1.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.1.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.1.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.1.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.1.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.1.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.10.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.10.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.10.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.10.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.10.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.10.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.100.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.100.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.100.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.100.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.100.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.100.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.101.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.101.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.101.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.101.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.101.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.101.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.102.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.102.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.102.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.102.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.102.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.102.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.103.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.103.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.103.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.103.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.103.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.103.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.104.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.104.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.104.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.104.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.104.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.104.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.105.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.105.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.105.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.105.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.105.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.105.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.106.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.106.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.106.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.106.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.106.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.106.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.107.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.107.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.107.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.107.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.107.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.107.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.108.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.108.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.108.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.108.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.108.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.108.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.109.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.109.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.109.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.109.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.109.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.109.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.11.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.11.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.11.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.11.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.11.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.11.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.110.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.110.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.110.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.110.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.110.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.110.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.111.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.111.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.111.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.111.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.111.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.111.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.112.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.112.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.112.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.112.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.112.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.112.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.113.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.113.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.113.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.113.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.113.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.113.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.114.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.114.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.114.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.114.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.114.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.114.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.115.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.115.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.115.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.115.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.115.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.115.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.116.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.116.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.116.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.116.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.116.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.116.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.117.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.117.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.117.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.117.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.117.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.117.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.118.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.118.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.118.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.118.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.118.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.118.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.119.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.119.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.119.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.119.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.119.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.119.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.12.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.12.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.12.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.12.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.12.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.12.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.120.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.120.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.120.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.120.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.120.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.120.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.121.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.121.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.121.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.121.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.121.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.121.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.122.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.122.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.122.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.122.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.122.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.122.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.123.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.123.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.123.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.123.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.123.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.123.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.124.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.124.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.124.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.124.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.124.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.124.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.125.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.125.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.125.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.125.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.125.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.125.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.126.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.126.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.126.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.126.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.126.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.126.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.127.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.127.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.127.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.127.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.127.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.127.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.128.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.128.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.128.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.128.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.128.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.128.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.129.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.129.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.129.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.129.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.129.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.129.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.13.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.13.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.13.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.13.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.13.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.13.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.130.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.130.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.130.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.130.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.130.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.130.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.131.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.131.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.131.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.131.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.131.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.131.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.132.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.132.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.132.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.132.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.132.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.132.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.133.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.133.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.133.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.133.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.133.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.133.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.134.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.134.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.134.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.134.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.134.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.134.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.135.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.135.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.135.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.135.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.135.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.135.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.136.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.136.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.136.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.136.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.136.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.136.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.137.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.137.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.137.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.137.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.137.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.137.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.138.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.138.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.138.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.138.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.138.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.138.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.139.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.139.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.139.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.139.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.139.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.139.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.14.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.14.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.14.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.14.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.14.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.14.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.140.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.140.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.140.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.140.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.140.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.140.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.141.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.141.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.141.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.141.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.141.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.141.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.142.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.142.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.142.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.142.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.142.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.142.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.143.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.143.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.143.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.143.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.143.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.143.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.144.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.144.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.144.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.144.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.144.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.144.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.145.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.145.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.145.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.145.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.145.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.145.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.146.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.146.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.146.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.146.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.146.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.146.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.147.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.147.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.147.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.147.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.147.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.147.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.148.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.148.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.148.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.148.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.148.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.148.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.149.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.149.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.149.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.149.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.149.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.149.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.15.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.15.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.15.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.15.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.15.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.15.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.150.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.150.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.150.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.150.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.150.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.150.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.151.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.151.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.151.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.151.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.151.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.151.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.152.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.152.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.152.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.152.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.152.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.152.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.153.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.153.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.153.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.153.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.153.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.153.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.154.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.154.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.154.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.154.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.154.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.154.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.155.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.155.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.155.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.155.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.155.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.155.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.156.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.156.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.156.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.156.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.156.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.156.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.157.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.157.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.157.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.157.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.157.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.157.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.158.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.158.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.158.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.158.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.158.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.158.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.159.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.159.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.159.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.159.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.159.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.159.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.16.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.16.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.16.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.16.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.16.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.16.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.17.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.17.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.17.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.17.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.17.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.17.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.18.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.18.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.18.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.18.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.18.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.18.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.19.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.19.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.19.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.19.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.19.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.19.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.2.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.2.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.2.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.2.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.2.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.2.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.20.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.20.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.20.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.20.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.20.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.20.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.21.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.21.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.21.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.21.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.21.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.21.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.22.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.22.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.22.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.22.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.22.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.22.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.23.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.23.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.23.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.23.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.23.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.23.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.24.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.24.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.24.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.24.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.24.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.24.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.25.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.25.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.25.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.25.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.25.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.25.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.26.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.26.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.26.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.26.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.26.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.26.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.27.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.27.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.27.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.27.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.27.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.27.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.28.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.28.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.28.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.28.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.28.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.28.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.29.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.29.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.29.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.29.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.29.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.29.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.3.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.3.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.3.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.3.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.3.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.3.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.30.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.30.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.30.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.30.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.30.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.30.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.31.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.31.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.31.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.31.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.31.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.31.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.32.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.32.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.32.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.32.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.32.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.32.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.33.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.33.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.33.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.33.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.33.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.33.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.34.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.34.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.34.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.34.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.34.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.34.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.35.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.35.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.35.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.35.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.35.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.35.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.36.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.36.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.36.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.36.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.36.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.36.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.37.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.37.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.37.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.37.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.37.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.37.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.38.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.38.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.38.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.38.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.38.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.38.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.39.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.39.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.39.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.39.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.39.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.39.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.4.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.4.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.4.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.4.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.4.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.4.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.40.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.40.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.40.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.40.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.40.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.40.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.41.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.41.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.41.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.41.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.41.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.41.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.42.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.42.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.42.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.42.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.42.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.42.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.43.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.43.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.43.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.43.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.43.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.43.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.44.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.44.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.44.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.44.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.44.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.44.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.45.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.45.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.45.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.45.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.45.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.45.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.46.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.46.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.46.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.46.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.46.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.46.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.47.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.47.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.47.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.47.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.47.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.47.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.48.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.48.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.48.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.48.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.48.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.48.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.49.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.49.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.49.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.49.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.49.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.49.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.5.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.5.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.5.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.5.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.5.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.5.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.50.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.50.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.50.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.50.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.50.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.50.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.51.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.51.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.51.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.51.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.51.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.51.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.52.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.52.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.52.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.52.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.52.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.52.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.53.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.53.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.53.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.53.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.53.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.53.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.54.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.54.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.54.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.54.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.54.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.54.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.55.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.55.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.55.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.55.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.55.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.55.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.56.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.56.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.56.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.56.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.56.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.56.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.57.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.57.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.57.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.57.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.57.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.57.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.58.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.58.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.58.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.58.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.58.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.58.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.59.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.59.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.59.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.59.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.59.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.59.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.6.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.6.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.6.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.6.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.6.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.6.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.60.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.60.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.60.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.60.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.60.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.60.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.61.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.61.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.61.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.61.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.61.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.61.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.62.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.62.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.62.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.62.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.62.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.62.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.63.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.63.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.63.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.63.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.63.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.63.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.64.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.64.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.64.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.64.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.64.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.64.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.65.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.65.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.65.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.65.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.65.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.65.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.66.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.66.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.66.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.66.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.66.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.66.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.67.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.67.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.67.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.67.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.67.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.67.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.68.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.68.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.68.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.68.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.68.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.68.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.69.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.69.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.69.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.69.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.69.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.69.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.7.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.7.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.7.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.7.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.7.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.7.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.70.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.70.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.70.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.70.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.70.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.70.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.71.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.71.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.71.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.71.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.71.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.71.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.72.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.72.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.72.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.72.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.72.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.72.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.73.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.73.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.73.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.73.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.73.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.73.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.74.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.74.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.74.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.74.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.74.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.74.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.75.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.75.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.75.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.75.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.75.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.75.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.76.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.76.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.76.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.76.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.76.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.76.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.77.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.77.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.77.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.77.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.77.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.77.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.78.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.78.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.78.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.78.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.78.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.78.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.79.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.79.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.79.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.79.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.79.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.79.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.8.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.8.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.8.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.8.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.8.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.8.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.80.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.80.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.80.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.80.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.80.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.80.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.81.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.81.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.81.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.81.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.81.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.81.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.82.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.82.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.82.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.82.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.82.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.82.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.83.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.83.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.83.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.83.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.83.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.83.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.84.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.84.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.84.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.84.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.84.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.84.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.85.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.85.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.85.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.85.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.85.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.85.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.86.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.86.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.86.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.86.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.86.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.86.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.87.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.87.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.87.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.87.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.87.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.87.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.88.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.88.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.88.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.88.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.88.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.88.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.89.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.89.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.89.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.89.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.89.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.89.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.9.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.9.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.9.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.9.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.9.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.9.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.90.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.90.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.90.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.90.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.90.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.90.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.91.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.91.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.91.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.91.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.91.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.91.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.92.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.92.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.92.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.92.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.92.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.92.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.93.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.93.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.93.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.93.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.93.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.93.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.94.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.94.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.94.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.94.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.94.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.94.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.95.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.95.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.95.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.95.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.95.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.95.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.96.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.96.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.96.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.96.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.96.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.96.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.97.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.97.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.97.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.97.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.97.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.97.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.98.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.98.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.98.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.98.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.98.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.98.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.99.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.99.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.99.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.99.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.99.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.experts.99.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.gate.e_score_correction_bias": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.gate.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.shared_experts.down_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.shared_experts.down_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.shared_experts.gate_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.shared_experts.gate_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.shared_experts.up_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.mlp.shared_experts.up_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.post_attention_layernorm.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.self_attn.k_norm.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.self_attn.k_proj.bias": "model-00038-of-00092.safetensors",
+ "model.layers.37.self_attn.k_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.self_attn.k_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.self_attn.o_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.self_attn.o_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.self_attn.q_norm.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.self_attn.q_proj.bias": "model-00038-of-00092.safetensors",
+ "model.layers.37.self_attn.q_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.self_attn.q_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.37.self_attn.v_proj.bias": "model-00038-of-00092.safetensors",
+ "model.layers.37.self_attn.v_proj.weight": "model-00038-of-00092.safetensors",
+ "model.layers.37.self_attn.v_proj.weight_scale": "model-00038-of-00092.safetensors",
+ "model.layers.38.input_layernorm.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.0.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.0.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.0.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.0.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.0.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.0.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.1.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.1.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.1.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.1.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.1.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.1.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.10.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.10.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.10.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.10.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.10.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.10.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.100.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.100.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.100.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.100.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.100.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.100.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.101.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.101.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.101.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.101.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.101.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.101.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.102.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.102.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.102.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.102.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.102.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.102.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.103.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.103.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.103.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.103.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.103.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.103.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.104.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.104.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.104.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.104.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.104.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.104.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.105.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.105.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.105.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.105.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.105.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.105.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.106.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.106.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.106.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.106.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.106.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.106.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.107.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.107.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.107.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.107.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.107.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.107.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.108.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.108.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.108.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.108.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.108.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.108.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.109.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.109.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.109.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.109.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.109.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.109.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.11.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.11.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.11.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.11.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.11.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.11.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.110.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.110.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.110.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.110.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.110.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.110.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.111.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.111.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.111.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.111.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.111.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.111.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.112.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.112.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.112.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.112.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.112.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.112.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.113.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.113.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.113.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.113.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.113.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.113.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.114.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.114.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.114.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.114.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.114.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.114.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.115.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.115.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.115.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.115.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.115.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.115.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.116.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.116.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.116.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.116.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.116.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.116.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.117.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.117.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.117.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.117.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.117.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.117.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.118.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.118.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.118.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.118.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.118.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.118.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.119.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.119.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.119.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.119.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.119.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.119.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.12.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.12.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.12.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.12.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.12.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.12.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.120.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.120.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.120.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.120.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.120.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.120.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.121.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.121.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.121.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.121.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.121.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.121.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.122.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.122.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.122.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.122.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.122.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.122.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.123.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.123.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.123.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.123.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.123.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.123.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.124.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.124.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.124.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.124.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.124.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.124.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.125.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.125.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.125.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.125.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.125.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.125.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.126.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.126.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.126.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.126.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.126.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.126.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.127.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.127.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.127.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.127.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.127.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.127.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.128.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.128.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.128.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.128.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.128.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.128.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.129.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.129.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.129.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.129.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.129.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.129.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.13.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.13.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.13.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.13.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.13.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.13.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.130.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.130.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.130.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.130.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.130.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.130.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.131.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.131.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.131.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.131.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.131.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.131.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.132.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.132.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.132.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.132.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.132.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.132.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.133.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.133.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.133.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.133.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.133.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.133.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.134.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.134.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.134.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.134.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.134.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.134.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.135.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.135.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.135.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.135.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.135.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.135.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.136.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.136.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.136.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.136.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.136.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.136.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.137.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.137.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.137.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.137.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.137.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.137.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.138.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.138.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.138.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.138.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.138.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.138.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.139.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.139.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.139.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.139.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.139.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.139.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.14.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.14.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.14.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.14.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.14.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.14.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.140.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.140.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.140.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.140.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.140.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.140.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.141.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.141.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.141.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.141.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.141.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.141.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.142.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.142.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.142.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.142.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.142.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.142.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.143.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.143.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.143.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.143.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.143.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.143.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.144.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.144.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.144.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.144.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.144.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.144.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.145.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.145.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.145.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.145.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.145.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.145.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.146.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.146.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.146.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.146.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.146.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.146.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.147.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.147.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.147.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.147.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.147.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.147.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.148.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.148.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.148.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.148.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.148.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.148.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.149.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.149.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.149.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.149.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.149.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.149.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.15.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.15.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.15.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.15.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.15.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.15.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.150.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.150.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.150.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.150.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.150.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.150.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.151.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.151.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.151.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.151.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.151.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.151.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.152.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.152.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.152.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.152.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.152.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.152.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.153.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.153.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.153.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.153.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.153.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.153.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.154.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.154.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.154.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.154.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.154.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.154.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.155.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.155.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.155.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.155.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.155.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.155.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.156.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.156.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.156.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.156.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.156.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.156.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.157.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.157.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.157.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.157.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.157.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.157.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.158.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.158.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.158.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.158.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.158.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.158.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.159.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.159.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.159.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.159.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.159.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.159.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.16.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.16.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.16.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.16.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.16.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.16.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.17.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.17.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.17.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.17.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.17.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.17.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.18.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.18.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.18.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.18.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.18.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.18.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.19.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.19.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.19.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.19.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.19.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.19.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.2.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.2.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.2.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.2.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.2.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.2.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.20.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.20.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.20.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.20.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.20.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.20.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.21.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.21.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.21.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.21.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.21.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.21.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.22.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.22.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.22.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.22.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.22.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.22.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.23.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.23.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.23.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.23.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.23.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.23.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.24.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.24.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.24.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.24.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.24.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.24.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.25.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.25.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.25.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.25.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.25.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.25.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.26.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.26.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.26.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.26.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.26.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.26.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.27.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.27.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.27.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.27.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.27.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.27.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.28.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.28.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.28.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.28.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.28.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.28.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.29.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.29.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.29.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.29.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.29.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.29.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.3.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.3.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.3.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.3.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.3.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.3.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.30.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.30.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.30.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.30.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.30.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.30.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.31.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.31.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.31.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.31.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.31.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.31.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.32.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.32.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.32.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.32.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.32.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.32.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.33.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.33.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.33.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.33.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.33.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.33.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.34.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.34.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.34.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.34.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.34.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.34.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.35.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.35.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.35.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.35.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.35.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.35.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.36.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.36.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.36.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.36.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.36.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.36.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.37.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.37.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.37.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.37.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.37.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.37.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.38.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.38.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.38.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.38.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.38.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.38.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.39.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.39.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.39.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.39.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.39.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.39.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.4.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.4.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.4.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.4.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.4.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.4.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.40.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.40.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.40.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.40.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.40.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.40.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.41.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.41.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.41.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.41.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.41.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.41.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.42.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.42.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.42.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.42.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.42.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.42.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.43.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.43.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.43.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.43.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.43.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.43.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.44.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.44.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.44.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.44.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.44.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.44.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.45.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.45.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.45.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.45.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.45.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.45.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.46.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.46.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.46.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.46.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.46.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.46.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.47.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.47.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.47.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.47.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.47.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.47.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.48.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.48.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.48.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.48.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.48.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.48.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.49.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.49.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.49.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.49.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.49.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.49.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.5.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.5.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.5.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.5.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.5.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.5.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.50.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.50.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.50.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.50.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.50.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.50.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.51.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.51.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.51.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.51.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.51.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.51.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.52.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.52.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.52.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.52.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.52.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.52.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.53.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.53.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.53.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.53.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.53.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.53.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.54.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.54.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.54.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.54.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.54.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.54.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.55.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.55.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.55.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.55.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.55.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.55.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.56.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.56.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.56.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.56.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.56.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.56.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.57.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.57.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.57.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.57.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.57.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.57.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.58.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.58.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.58.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.58.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.58.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.58.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.59.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.59.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.59.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.59.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.59.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.59.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.6.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.6.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.6.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.6.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.6.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.6.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.60.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.60.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.60.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.60.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.60.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.60.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.61.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.61.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.61.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.61.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.61.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.61.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.62.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.62.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.62.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.62.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.62.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.62.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.63.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.63.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.63.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.63.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.63.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.63.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.64.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.64.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.64.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.64.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.64.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.64.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.65.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.65.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.65.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.65.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.65.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.65.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.66.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.66.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.66.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.66.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.66.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.66.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.67.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.67.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.67.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.67.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.67.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.67.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.68.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.68.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.68.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.68.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.68.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.68.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.69.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.69.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.69.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.69.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.69.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.69.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.7.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.7.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.7.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.7.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.7.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.7.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.70.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.70.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.70.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.70.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.70.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.70.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.71.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.71.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.71.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.71.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.71.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.71.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.72.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.72.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.72.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.72.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.72.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.72.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.73.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.73.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.73.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.73.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.73.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.73.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.74.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.74.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.74.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.74.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.74.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.74.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.75.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.75.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.75.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.75.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.75.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.75.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.76.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.76.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.76.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.76.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.76.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.76.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.77.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.77.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.77.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.77.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.77.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.77.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.78.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.78.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.78.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.78.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.78.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.78.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.79.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.79.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.79.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.79.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.79.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.79.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.8.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.8.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.8.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.8.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.8.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.8.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.80.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.80.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.80.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.80.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.80.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.80.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.81.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.81.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.81.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.81.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.81.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.81.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.82.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.82.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.82.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.82.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.82.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.82.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.83.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.83.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.83.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.83.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.83.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.83.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.84.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.84.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.84.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.84.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.84.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.84.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.85.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.85.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.85.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.85.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.85.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.85.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.86.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.86.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.86.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.86.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.86.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.86.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.87.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.87.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.87.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.87.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.87.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.87.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.88.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.88.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.88.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.88.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.88.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.88.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.89.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.89.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.89.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.89.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.89.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.89.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.9.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.9.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.9.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.9.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.9.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.9.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.90.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.90.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.90.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.90.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.90.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.90.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.91.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.91.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.91.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.91.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.91.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.91.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.92.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.92.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.92.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.92.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.92.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.92.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.93.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.93.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.93.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.93.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.93.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.93.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.94.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.94.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.94.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.94.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.94.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.94.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.95.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.95.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.95.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.95.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.95.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.95.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.96.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.96.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.96.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.96.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.96.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.96.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.97.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.97.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.97.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.97.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.97.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.97.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.98.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.98.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.98.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.98.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.98.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.98.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.99.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.99.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.99.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.99.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.99.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.experts.99.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.gate.e_score_correction_bias": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.gate.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.shared_experts.down_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.shared_experts.down_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.shared_experts.gate_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.shared_experts.gate_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.shared_experts.up_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.mlp.shared_experts.up_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.post_attention_layernorm.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.self_attn.k_norm.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.self_attn.k_proj.bias": "model-00039-of-00092.safetensors",
+ "model.layers.38.self_attn.k_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.self_attn.k_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.self_attn.o_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.self_attn.o_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.self_attn.q_norm.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.self_attn.q_proj.bias": "model-00039-of-00092.safetensors",
+ "model.layers.38.self_attn.q_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.self_attn.q_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.38.self_attn.v_proj.bias": "model-00039-of-00092.safetensors",
+ "model.layers.38.self_attn.v_proj.weight": "model-00039-of-00092.safetensors",
+ "model.layers.38.self_attn.v_proj.weight_scale": "model-00039-of-00092.safetensors",
+ "model.layers.39.input_layernorm.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.0.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.0.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.0.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.0.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.0.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.0.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.1.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.1.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.1.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.1.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.1.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.1.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.10.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.10.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.10.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.10.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.10.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.10.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.100.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.100.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.100.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.100.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.100.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.100.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.101.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.101.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.101.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.101.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.101.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.101.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.102.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.102.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.102.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.102.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.102.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.102.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.103.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.103.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.103.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.103.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.103.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.103.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.104.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.104.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.104.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.104.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.104.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.104.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.105.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.105.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.105.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.105.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.105.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.105.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.106.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.106.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.106.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.106.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.106.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.106.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.107.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.107.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.107.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.107.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.107.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.107.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.108.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.108.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.108.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.108.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.108.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.108.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.109.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.109.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.109.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.109.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.109.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.109.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.11.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.11.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.11.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.11.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.11.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.11.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.110.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.110.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.110.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.110.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.110.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.110.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.111.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.111.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.111.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.111.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.111.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.111.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.112.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.112.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.112.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.112.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.112.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.112.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.113.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.113.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.113.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.113.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.113.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.113.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.114.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.114.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.114.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.114.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.114.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.114.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.115.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.115.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.115.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.115.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.115.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.115.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.116.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.116.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.116.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.116.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.116.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.116.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.117.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.117.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.117.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.117.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.117.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.117.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.118.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.118.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.118.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.118.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.118.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.118.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.119.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.119.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.119.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.119.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.119.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.119.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.12.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.12.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.12.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.12.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.12.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.12.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.120.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.120.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.120.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.120.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.120.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.120.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.121.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.121.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.121.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.121.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.121.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.121.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.122.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.122.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.122.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.122.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.122.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.122.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.123.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.123.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.123.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.123.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.123.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.123.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.124.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.124.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.124.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.124.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.124.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.124.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.125.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.125.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.125.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.125.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.125.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.125.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.126.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.126.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.126.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.126.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.126.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.126.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.127.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.127.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.127.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.127.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.127.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.127.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.128.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.128.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.128.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.128.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.128.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.128.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.129.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.129.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.129.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.129.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.129.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.129.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.13.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.13.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.13.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.13.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.13.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.13.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.130.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.130.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.130.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.130.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.130.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.130.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.131.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.131.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.131.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.131.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.131.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.131.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.132.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.132.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.132.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.132.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.132.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.132.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.133.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.133.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.133.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.133.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.133.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.133.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.134.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.134.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.134.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.134.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.134.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.134.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.135.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.135.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.135.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.135.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.135.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.135.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.136.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.136.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.136.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.136.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.136.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.136.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.137.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.137.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.137.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.137.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.137.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.137.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.138.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.138.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.138.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.138.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.138.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.138.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.139.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.139.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.139.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.139.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.139.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.139.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.14.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.14.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.14.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.14.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.14.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.14.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.140.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.140.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.140.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.140.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.140.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.140.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.141.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.141.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.141.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.141.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.141.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.141.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.142.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.142.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.142.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.142.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.142.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.142.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.143.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.143.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.143.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.143.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.143.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.143.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.144.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.144.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.144.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.144.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.144.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.144.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.145.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.145.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.145.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.145.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.145.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.145.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.146.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.146.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.146.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.146.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.146.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.146.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.147.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.147.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.147.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.147.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.147.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.147.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.148.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.148.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.148.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.148.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.148.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.148.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.149.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.149.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.149.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.149.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.149.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.149.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.15.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.15.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.15.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.15.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.15.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.15.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.150.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.150.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.150.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.150.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.150.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.150.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.151.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.151.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.151.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.151.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.151.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.151.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.152.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.152.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.152.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.152.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.152.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.152.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.153.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.153.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.153.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.153.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.153.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.153.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.154.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.154.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.154.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.154.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.154.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.154.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.155.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.155.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.155.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.155.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.155.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.155.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.156.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.156.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.156.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.156.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.156.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.156.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.157.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.157.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.157.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.157.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.157.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.157.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.158.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.158.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.158.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.158.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.158.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.158.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.159.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.159.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.159.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.159.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.159.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.159.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.16.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.16.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.16.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.16.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.16.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.16.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.17.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.17.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.17.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.17.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.17.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.17.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.18.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.18.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.18.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.18.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.18.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.18.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.19.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.19.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.19.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.19.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.19.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.19.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.2.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.2.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.2.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.2.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.2.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.2.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.20.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.20.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.20.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.20.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.20.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.20.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.21.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.21.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.21.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.21.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.21.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.21.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.22.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.22.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.22.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.22.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.22.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.22.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.23.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.23.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.23.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.23.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.23.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.23.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.24.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.24.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.24.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.24.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.24.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.24.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.25.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.25.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.25.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.25.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.25.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.25.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.26.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.26.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.26.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.26.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.26.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.26.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.27.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.27.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.27.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.27.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.27.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.27.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.28.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.28.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.28.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.28.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.28.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.28.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.29.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.29.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.29.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.29.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.29.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.29.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.3.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.3.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.3.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.3.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.3.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.3.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.30.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.30.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.30.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.30.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.30.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.30.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.31.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.31.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.31.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.31.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.31.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.31.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.32.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.32.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.32.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.32.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.32.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.32.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.33.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.33.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.33.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.33.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.33.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.33.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.34.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.34.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.34.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.34.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.34.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.34.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.35.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.35.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.35.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.35.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.35.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.35.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.36.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.36.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.36.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.36.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.36.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.36.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.37.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.37.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.37.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.37.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.37.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.37.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.38.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.38.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.38.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.38.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.38.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.38.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.39.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.39.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.39.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.39.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.39.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.39.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.4.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.4.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.4.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.4.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.4.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.4.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.40.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.40.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.40.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.40.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.40.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.40.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.41.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.41.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.41.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.41.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.41.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.41.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.42.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.42.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.42.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.42.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.42.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.42.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.43.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.43.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.43.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.43.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.43.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.43.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.44.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.44.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.44.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.44.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.44.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.44.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.45.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.45.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.45.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.45.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.45.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.45.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.46.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.46.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.46.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.46.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.46.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.46.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.47.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.47.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.47.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.47.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.47.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.47.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.48.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.48.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.48.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.48.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.48.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.48.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.49.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.49.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.49.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.49.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.49.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.49.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.5.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.5.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.5.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.5.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.5.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.5.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.50.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.50.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.50.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.50.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.50.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.50.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.51.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.51.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.51.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.51.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.51.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.51.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.52.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.52.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.52.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.52.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.52.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.52.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.53.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.53.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.53.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.53.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.53.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.53.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.54.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.54.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.54.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.54.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.54.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.54.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.55.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.55.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.55.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.55.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.55.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.55.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.56.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.56.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.56.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.56.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.56.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.56.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.57.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.57.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.57.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.57.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.57.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.57.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.58.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.58.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.58.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.58.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.58.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.58.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.59.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.59.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.59.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.59.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.59.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.59.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.6.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.6.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.6.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.6.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.6.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.6.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.60.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.60.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.60.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.60.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.60.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.60.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.61.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.61.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.61.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.61.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.61.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.61.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.62.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.62.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.62.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.62.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.62.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.62.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.63.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.63.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.63.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.63.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.63.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.63.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.64.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.64.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.64.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.64.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.64.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.64.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.65.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.65.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.65.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.65.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.65.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.65.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.66.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.66.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.66.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.66.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.66.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.66.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.67.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.67.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.67.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.67.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.67.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.67.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.68.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.68.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.68.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.68.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.68.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.68.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.69.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.69.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.69.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.69.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.69.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.69.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.7.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.7.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.7.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.7.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.7.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.7.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.70.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.70.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.70.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.70.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.70.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.70.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.71.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.71.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.71.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.71.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.71.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.71.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.72.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.72.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.72.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.72.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.72.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.72.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.73.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.73.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.73.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.73.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.73.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.73.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.74.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.74.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.74.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.74.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.74.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.74.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.75.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.75.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.75.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.75.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.75.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.75.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.76.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.76.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.76.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.76.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.76.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.76.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.77.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.77.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.77.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.77.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.77.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.77.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.78.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.78.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.78.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.78.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.78.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.78.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.79.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.79.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.79.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.79.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.79.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.79.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.8.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.8.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.8.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.8.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.8.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.8.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.80.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.80.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.80.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.80.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.80.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.80.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.81.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.81.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.81.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.81.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.81.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.81.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.82.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.82.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.82.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.82.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.82.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.82.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.83.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.83.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.83.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.83.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.83.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.83.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.84.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.84.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.84.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.84.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.84.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.84.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.85.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.85.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.85.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.85.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.85.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.85.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.86.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.86.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.86.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.86.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.86.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.86.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.87.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.87.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.87.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.87.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.87.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.87.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.88.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.88.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.88.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.88.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.88.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.88.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.89.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.89.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.89.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.89.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.89.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.89.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.9.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.9.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.9.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.9.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.9.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.9.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.90.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.90.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.90.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.90.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.90.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.90.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.91.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.91.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.91.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.91.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.91.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.91.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.92.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.92.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.92.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.92.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.92.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.92.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.93.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.93.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.93.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.93.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.93.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.93.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.94.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.94.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.94.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.94.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.94.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.94.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.95.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.95.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.95.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.95.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.95.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.95.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.96.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.96.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.96.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.96.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.96.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.96.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.97.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.97.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.97.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.97.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.97.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.97.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.98.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.98.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.98.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.98.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.98.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.98.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.99.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.99.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.99.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.99.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.99.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.experts.99.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.gate.e_score_correction_bias": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.gate.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.shared_experts.down_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.shared_experts.down_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.shared_experts.gate_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.shared_experts.gate_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.shared_experts.up_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.mlp.shared_experts.up_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.post_attention_layernorm.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.self_attn.k_norm.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.self_attn.k_proj.bias": "model-00040-of-00092.safetensors",
+ "model.layers.39.self_attn.k_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.self_attn.k_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.self_attn.o_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.self_attn.o_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.self_attn.q_norm.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.self_attn.q_proj.bias": "model-00040-of-00092.safetensors",
+ "model.layers.39.self_attn.q_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.self_attn.q_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.39.self_attn.v_proj.bias": "model-00040-of-00092.safetensors",
+ "model.layers.39.self_attn.v_proj.weight": "model-00040-of-00092.safetensors",
+ "model.layers.39.self_attn.v_proj.weight_scale": "model-00040-of-00092.safetensors",
+ "model.layers.4.input_layernorm.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.0.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.0.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.0.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.0.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.0.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.0.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.1.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.1.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.1.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.1.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.1.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.1.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.10.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.10.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.10.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.10.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.10.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.10.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.100.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.100.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.100.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.100.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.100.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.100.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.101.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.101.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.101.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.101.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.101.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.101.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.102.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.102.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.102.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.102.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.102.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.102.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.103.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.103.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.103.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.103.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.103.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.103.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.104.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.104.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.104.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.104.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.104.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.104.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.105.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.105.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.105.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.105.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.105.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.105.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.106.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.106.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.106.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.106.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.106.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.106.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.107.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.107.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.107.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.107.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.107.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.107.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.108.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.108.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.108.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.108.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.108.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.108.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.109.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.109.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.109.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.109.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.109.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.109.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.11.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.11.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.11.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.11.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.11.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.11.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.110.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.110.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.110.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.110.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.110.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.110.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.111.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.111.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.111.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.111.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.111.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.111.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.112.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.112.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.112.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.112.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.112.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.112.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.113.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.113.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.113.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.113.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.113.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.113.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.114.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.114.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.114.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.114.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.114.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.114.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.115.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.115.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.115.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.115.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.115.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.115.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.116.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.116.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.116.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.116.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.116.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.116.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.117.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.117.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.117.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.117.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.117.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.117.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.118.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.118.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.118.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.118.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.118.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.118.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.119.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.119.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.119.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.119.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.119.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.119.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.12.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.12.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.12.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.12.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.12.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.12.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.120.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.120.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.120.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.120.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.120.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.120.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.121.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.121.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.121.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.121.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.121.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.121.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.122.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.122.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.122.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.122.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.122.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.122.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.123.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.123.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.123.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.123.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.123.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.123.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.124.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.124.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.124.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.124.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.124.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.124.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.125.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.125.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.125.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.125.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.125.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.125.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.126.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.126.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.126.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.126.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.126.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.126.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.127.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.127.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.127.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.127.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.127.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.127.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.128.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.128.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.128.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.128.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.128.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.128.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.129.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.129.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.129.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.129.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.129.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.129.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.13.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.13.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.13.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.13.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.13.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.13.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.130.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.130.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.130.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.130.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.130.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.130.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.131.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.131.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.131.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.131.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.131.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.131.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.132.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.132.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.132.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.132.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.132.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.132.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.133.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.133.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.133.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.133.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.133.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.133.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.134.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.134.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.134.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.134.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.134.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.134.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.135.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.135.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.135.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.135.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.135.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.135.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.136.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.136.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.136.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.136.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.136.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.136.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.137.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.137.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.137.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.137.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.137.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.137.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.138.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.138.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.138.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.138.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.138.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.138.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.139.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.139.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.139.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.139.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.139.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.139.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.14.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.14.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.14.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.14.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.14.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.14.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.140.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.140.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.140.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.140.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.140.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.140.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.141.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.141.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.141.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.141.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.141.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.141.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.142.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.142.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.142.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.142.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.142.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.142.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.143.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.143.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.143.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.143.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.143.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.143.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.144.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.144.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.144.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.144.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.144.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.144.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.145.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.145.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.145.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.145.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.145.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.145.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.146.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.146.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.146.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.146.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.146.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.146.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.147.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.147.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.147.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.147.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.147.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.147.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.148.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.148.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.148.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.148.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.148.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.148.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.149.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.149.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.149.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.149.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.149.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.149.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.15.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.15.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.15.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.15.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.15.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.15.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.150.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.150.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.150.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.150.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.150.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.150.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.151.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.151.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.151.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.151.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.151.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.151.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.152.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.152.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.152.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.152.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.152.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.152.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.153.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.153.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.153.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.153.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.153.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.153.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.154.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.154.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.154.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.154.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.154.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.154.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.155.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.155.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.155.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.155.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.155.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.155.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.156.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.156.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.156.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.156.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.156.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.156.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.157.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.157.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.157.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.157.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.157.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.157.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.158.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.158.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.158.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.158.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.158.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.158.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.159.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.159.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.159.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.159.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.159.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.159.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.16.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.16.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.16.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.16.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.16.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.16.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.17.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.17.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.17.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.17.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.17.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.17.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.18.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.18.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.18.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.18.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.18.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.18.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.19.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.19.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.19.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.19.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.19.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.19.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.2.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.2.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.2.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.2.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.2.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.2.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.20.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.20.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.20.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.20.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.20.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.20.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.21.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.21.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.21.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.21.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.21.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.21.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.22.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.22.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.22.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.22.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.22.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.22.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.23.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.23.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.23.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.23.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.23.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.23.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.24.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.24.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.24.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.24.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.24.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.24.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.25.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.25.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.25.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.25.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.25.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.25.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.26.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.26.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.26.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.26.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.26.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.26.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.27.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.27.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.27.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.27.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.27.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.27.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.28.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.28.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.28.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.28.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.28.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.28.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.29.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.29.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.29.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.29.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.29.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.29.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.3.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.3.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.3.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.3.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.3.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.3.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.30.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.30.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.30.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.30.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.30.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.30.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.31.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.31.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.31.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.31.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.31.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.31.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.32.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.32.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.32.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.32.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.32.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.32.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.33.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.33.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.33.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.33.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.33.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.33.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.34.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.34.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.34.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.34.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.34.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.34.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.35.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.35.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.35.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.35.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.35.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.35.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.36.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.36.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.36.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.36.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.36.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.36.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.37.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.37.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.37.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.37.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.37.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.37.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.38.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.38.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.38.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.38.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.38.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.38.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.39.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.39.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.39.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.39.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.39.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.39.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.4.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.4.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.4.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.4.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.4.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.4.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.40.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.40.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.40.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.40.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.40.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.40.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.41.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.41.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.41.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.41.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.41.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.41.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.42.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.42.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.42.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.42.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.42.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.42.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.43.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.43.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.43.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.43.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.43.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.43.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.44.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.44.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.44.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.44.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.44.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.44.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.45.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.45.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.45.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.45.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.45.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.45.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.46.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.46.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.46.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.46.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.46.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.46.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.47.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.47.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.47.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.47.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.47.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.47.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.48.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.48.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.48.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.48.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.48.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.48.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.49.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.49.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.49.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.49.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.49.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.49.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.5.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.5.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.5.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.5.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.5.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.5.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.50.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.50.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.50.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.50.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.50.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.50.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.51.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.51.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.51.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.51.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.51.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.51.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.52.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.52.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.52.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.52.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.52.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.52.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.53.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.53.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.53.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.53.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.53.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.53.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.54.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.54.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.54.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.54.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.54.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.54.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.55.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.55.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.55.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.55.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.55.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.55.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.56.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.56.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.56.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.56.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.56.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.56.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.57.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.57.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.57.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.57.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.57.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.57.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.58.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.58.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.58.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.58.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.58.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.58.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.59.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.59.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.59.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.59.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.59.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.59.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.6.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.6.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.6.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.6.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.6.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.6.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.60.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.60.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.60.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.60.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.60.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.60.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.61.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.61.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.61.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.61.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.61.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.61.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.62.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.62.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.62.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.62.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.62.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.62.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.63.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.63.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.63.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.63.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.63.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.63.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.64.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.64.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.64.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.64.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.64.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.64.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.65.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.65.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.65.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.65.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.65.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.65.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.66.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.66.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.66.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.66.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.66.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.66.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.67.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.67.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.67.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.67.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.67.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.67.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.68.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.68.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.68.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.68.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.68.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.68.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.69.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.69.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.69.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.69.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.69.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.69.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.7.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.7.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.7.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.7.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.7.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.7.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.70.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.70.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.70.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.70.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.70.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.70.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.71.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.71.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.71.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.71.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.71.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.71.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.72.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.72.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.72.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.72.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.72.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.72.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.73.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.73.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.73.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.73.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.73.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.73.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.74.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.74.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.74.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.74.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.74.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.74.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.75.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.75.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.75.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.75.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.75.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.75.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.76.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.76.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.76.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.76.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.76.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.76.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.77.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.77.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.77.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.77.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.77.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.77.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.78.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.78.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.78.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.78.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.78.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.78.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.79.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.79.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.79.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.79.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.79.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.79.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.8.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.8.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.8.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.8.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.8.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.8.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.80.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.80.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.80.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.80.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.80.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.80.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.81.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.81.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.81.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.81.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.81.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.81.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.82.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.82.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.82.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.82.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.82.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.82.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.83.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.83.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.83.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.83.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.83.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.83.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.84.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.84.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.84.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.84.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.84.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.84.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.85.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.85.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.85.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.85.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.85.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.85.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.86.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.86.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.86.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.86.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.86.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.86.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.87.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.87.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.87.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.87.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.87.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.87.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.88.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.88.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.88.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.88.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.88.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.88.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.89.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.89.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.89.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.89.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.89.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.89.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.9.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.9.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.9.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.9.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.9.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.9.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.90.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.90.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.90.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.90.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.90.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.90.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.91.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.91.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.91.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.91.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.91.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.91.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.92.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.92.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.92.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.92.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.92.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.92.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.93.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.93.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.93.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.93.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.93.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.93.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.94.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.94.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.94.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.94.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.94.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.94.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.95.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.95.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.95.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.95.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.95.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.95.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.96.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.96.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.96.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.96.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.96.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.96.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.97.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.97.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.97.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.97.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.97.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.97.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.98.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.98.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.98.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.98.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.98.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.98.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.99.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.99.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.99.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.99.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.99.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.experts.99.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.gate.e_score_correction_bias": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.gate.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.shared_experts.down_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.shared_experts.down_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.shared_experts.gate_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.shared_experts.gate_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.shared_experts.up_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.mlp.shared_experts.up_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.post_attention_layernorm.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.self_attn.k_norm.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.self_attn.k_proj.bias": "model-00005-of-00092.safetensors",
+ "model.layers.4.self_attn.k_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.self_attn.k_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.self_attn.o_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.self_attn.o_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.self_attn.q_norm.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.self_attn.q_proj.bias": "model-00005-of-00092.safetensors",
+ "model.layers.4.self_attn.q_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.self_attn.q_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.4.self_attn.v_proj.bias": "model-00005-of-00092.safetensors",
+ "model.layers.4.self_attn.v_proj.weight": "model-00005-of-00092.safetensors",
+ "model.layers.4.self_attn.v_proj.weight_scale": "model-00005-of-00092.safetensors",
+ "model.layers.40.input_layernorm.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.0.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.0.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.0.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.0.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.0.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.0.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.1.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.1.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.1.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.1.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.1.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.1.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.10.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.10.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.10.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.10.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.10.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.10.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.100.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.100.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.100.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.100.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.100.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.100.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.101.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.101.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.101.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.101.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.101.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.101.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.102.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.102.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.102.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.102.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.102.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.102.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.103.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.103.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.103.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.103.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.103.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.103.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.104.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.104.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.104.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.104.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.104.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.104.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.105.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.105.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.105.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.105.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.105.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.105.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.106.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.106.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.106.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.106.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.106.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.106.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.107.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.107.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.107.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.107.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.107.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.107.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.108.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.108.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.108.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.108.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.108.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.108.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.109.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.109.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.109.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.109.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.109.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.109.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.11.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.11.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.11.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.11.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.11.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.11.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.110.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.110.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.110.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.110.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.110.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.110.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.111.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.111.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.111.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.111.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.111.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.111.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.112.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.112.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.112.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.112.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.112.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.112.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.113.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.113.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.113.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.113.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.113.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.113.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.114.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.114.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.114.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.114.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.114.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.114.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.115.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.115.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.115.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.115.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.115.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.115.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.116.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.116.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.116.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.116.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.116.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.116.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.117.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.117.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.117.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.117.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.117.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.117.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.118.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.118.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.118.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.118.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.118.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.118.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.119.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.119.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.119.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.119.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.119.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.119.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.12.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.12.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.12.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.12.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.12.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.12.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.120.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.120.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.120.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.120.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.120.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.120.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.121.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.121.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.121.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.121.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.121.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.121.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.122.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.122.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.122.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.122.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.122.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.122.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.123.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.123.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.123.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.123.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.123.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.123.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.124.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.124.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.124.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.124.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.124.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.124.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.125.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.125.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.125.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.125.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.125.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.125.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.126.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.126.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.126.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.126.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.126.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.126.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.127.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.127.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.127.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.127.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.127.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.127.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.128.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.128.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.128.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.128.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.128.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.128.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.129.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.129.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.129.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.129.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.129.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.129.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.13.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.13.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.13.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.13.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.13.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.13.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.130.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.130.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.130.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.130.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.130.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.130.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.131.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.131.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.131.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.131.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.131.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.131.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.132.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.132.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.132.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.132.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.132.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.132.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.133.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.133.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.133.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.133.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.133.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.133.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.134.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.134.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.134.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.134.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.134.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.134.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.135.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.135.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.135.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.135.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.135.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.135.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.136.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.136.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.136.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.136.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.136.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.136.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.137.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.137.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.137.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.137.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.137.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.137.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.138.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.138.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.138.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.138.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.138.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.138.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.139.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.139.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.139.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.139.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.139.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.139.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.14.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.14.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.14.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.14.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.14.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.14.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.140.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.140.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.140.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.140.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.140.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.140.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.141.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.141.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.141.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.141.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.141.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.141.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.142.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.142.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.142.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.142.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.142.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.142.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.143.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.143.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.143.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.143.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.143.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.143.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.144.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.144.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.144.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.144.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.144.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.144.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.145.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.145.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.145.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.145.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.145.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.145.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.146.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.146.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.146.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.146.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.146.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.146.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.147.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.147.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.147.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.147.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.147.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.147.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.148.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.148.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.148.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.148.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.148.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.148.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.149.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.149.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.149.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.149.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.149.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.149.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.15.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.15.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.15.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.15.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.15.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.15.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.150.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.150.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.150.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.150.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.150.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.150.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.151.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.151.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.151.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.151.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.151.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.151.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.152.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.152.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.152.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.152.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.152.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.152.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.153.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.153.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.153.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.153.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.153.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.153.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.154.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.154.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.154.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.154.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.154.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.154.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.155.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.155.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.155.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.155.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.155.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.155.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.156.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.156.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.156.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.156.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.156.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.156.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.157.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.157.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.157.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.157.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.157.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.157.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.158.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.158.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.158.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.158.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.158.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.158.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.159.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.159.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.159.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.159.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.159.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.159.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.16.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.16.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.16.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.16.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.16.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.16.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.17.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.17.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.17.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.17.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.17.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.17.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.18.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.18.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.18.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.18.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.18.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.18.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.19.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.19.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.19.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.19.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.19.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.19.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.2.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.2.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.2.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.2.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.2.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.2.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.20.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.20.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.20.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.20.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.20.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.20.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.21.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.21.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.21.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.21.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.21.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.21.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.22.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.22.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.22.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.22.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.22.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.22.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.23.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.23.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.23.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.23.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.23.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.23.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.24.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.24.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.24.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.24.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.24.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.24.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.25.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.25.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.25.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.25.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.25.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.25.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.26.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.26.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.26.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.26.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.26.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.26.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.27.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.27.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.27.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.27.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.27.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.27.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.28.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.28.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.28.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.28.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.28.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.28.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.29.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.29.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.29.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.29.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.29.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.29.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.3.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.3.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.3.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.3.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.3.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.3.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.30.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.30.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.30.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.30.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.30.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.30.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.31.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.31.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.31.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.31.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.31.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.31.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.32.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.32.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.32.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.32.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.32.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.32.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.33.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.33.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.33.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.33.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.33.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.33.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.34.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.34.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.34.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.34.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.34.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.34.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.35.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.35.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.35.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.35.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.35.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.35.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.36.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.36.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.36.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.36.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.36.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.36.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.37.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.37.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.37.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.37.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.37.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.37.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.38.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.38.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.38.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.38.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.38.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.38.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.39.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.39.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.39.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.39.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.39.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.39.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.4.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.4.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.4.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.4.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.4.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.4.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.40.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.40.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.40.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.40.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.40.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.40.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.41.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.41.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.41.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.41.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.41.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.41.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.42.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.42.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.42.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.42.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.42.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.42.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.43.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.43.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.43.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.43.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.43.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.43.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.44.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.44.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.44.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.44.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.44.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.44.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.45.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.45.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.45.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.45.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.45.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.45.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.46.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.46.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.46.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.46.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.46.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.46.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.47.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.47.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.47.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.47.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.47.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.47.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.48.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.48.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.48.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.48.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.48.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.48.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.49.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.49.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.49.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.49.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.49.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.49.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.5.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.5.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.5.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.5.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.5.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.5.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.50.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.50.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.50.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.50.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.50.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.50.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.51.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.51.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.51.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.51.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.51.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.51.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.52.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.52.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.52.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.52.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.52.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.52.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.53.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.53.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.53.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.53.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.53.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.53.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.54.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.54.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.54.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.54.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.54.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.54.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.55.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.55.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.55.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.55.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.55.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.55.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.56.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.56.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.56.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.56.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.56.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.56.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.57.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.57.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.57.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.57.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.57.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.57.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.58.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.58.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.58.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.58.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.58.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.58.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.59.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.59.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.59.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.59.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.59.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.59.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.6.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.6.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.6.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.6.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.6.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.6.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.60.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.60.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.60.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.60.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.60.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.60.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.61.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.61.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.61.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.61.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.61.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.61.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.62.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.62.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.62.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.62.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.62.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.62.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.63.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.63.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.63.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.63.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.63.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.63.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.64.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.64.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.64.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.64.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.64.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.64.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.65.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.65.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.65.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.65.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.65.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.65.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.66.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.66.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.66.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.66.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.66.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.66.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.67.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.67.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.67.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.67.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.67.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.67.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.68.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.68.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.68.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.68.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.68.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.68.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.69.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.69.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.69.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.69.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.69.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.69.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.7.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.7.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.7.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.7.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.7.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.7.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.70.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.70.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.70.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.70.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.70.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.70.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.71.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.71.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.71.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.71.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.71.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.71.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.72.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.72.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.72.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.72.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.72.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.72.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.73.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.73.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.73.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.73.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.73.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.73.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.74.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.74.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.74.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.74.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.74.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.74.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.75.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.75.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.75.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.75.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.75.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.75.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.76.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.76.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.76.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.76.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.76.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.76.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.77.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.77.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.77.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.77.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.77.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.77.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.78.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.78.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.78.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.78.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.78.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.78.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.79.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.79.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.79.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.79.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.79.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.79.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.8.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.8.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.8.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.8.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.8.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.8.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.80.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.80.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.80.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.80.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.80.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.80.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.81.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.81.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.81.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.81.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.81.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.81.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.82.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.82.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.82.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.82.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.82.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.82.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.83.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.83.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.83.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.83.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.83.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.83.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.84.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.84.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.84.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.84.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.84.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.84.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.85.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.85.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.85.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.85.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.85.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.85.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.86.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.86.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.86.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.86.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.86.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.86.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.87.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.87.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.87.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.87.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.87.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.87.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.88.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.88.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.88.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.88.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.88.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.88.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.89.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.89.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.89.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.89.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.89.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.89.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.9.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.9.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.9.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.9.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.9.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.9.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.90.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.90.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.90.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.90.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.90.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.90.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.91.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.91.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.91.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.91.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.91.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.91.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.92.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.92.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.92.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.92.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.92.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.92.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.93.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.93.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.93.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.93.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.93.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.93.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.94.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.94.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.94.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.94.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.94.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.94.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.95.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.95.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.95.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.95.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.95.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.95.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.96.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.96.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.96.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.96.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.96.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.96.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.97.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.97.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.97.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.97.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.97.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.97.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.98.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.98.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.98.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.98.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.98.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.98.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.99.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.99.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.99.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.99.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.99.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.experts.99.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.gate.e_score_correction_bias": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.gate.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.shared_experts.down_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.shared_experts.down_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.shared_experts.gate_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.shared_experts.gate_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.shared_experts.up_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.mlp.shared_experts.up_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.post_attention_layernorm.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.self_attn.k_norm.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.self_attn.k_proj.bias": "model-00041-of-00092.safetensors",
+ "model.layers.40.self_attn.k_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.self_attn.k_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.self_attn.o_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.self_attn.o_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.self_attn.q_norm.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.self_attn.q_proj.bias": "model-00041-of-00092.safetensors",
+ "model.layers.40.self_attn.q_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.self_attn.q_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.40.self_attn.v_proj.bias": "model-00041-of-00092.safetensors",
+ "model.layers.40.self_attn.v_proj.weight": "model-00041-of-00092.safetensors",
+ "model.layers.40.self_attn.v_proj.weight_scale": "model-00041-of-00092.safetensors",
+ "model.layers.41.input_layernorm.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.0.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.0.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.0.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.0.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.0.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.0.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.1.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.1.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.1.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.1.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.1.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.1.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.10.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.10.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.10.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.10.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.10.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.10.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.100.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.100.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.100.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.100.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.100.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.100.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.101.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.101.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.101.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.101.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.101.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.101.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.102.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.102.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.102.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.102.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.102.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.102.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.103.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.103.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.103.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.103.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.103.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.103.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.104.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.104.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.104.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.104.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.104.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.104.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.105.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.105.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.105.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.105.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.105.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.105.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.106.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.106.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.106.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.106.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.106.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.106.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.107.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.107.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.107.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.107.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.107.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.107.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.108.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.108.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.108.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.108.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.108.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.108.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.109.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.109.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.109.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.109.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.109.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.109.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.11.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.11.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.11.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.11.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.11.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.11.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.110.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.110.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.110.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.110.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.110.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.110.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.111.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.111.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.111.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.111.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.111.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.111.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.112.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.112.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.112.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.112.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.112.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.112.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.113.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.113.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.113.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.113.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.113.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.113.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.114.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.114.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.114.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.114.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.114.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.114.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.115.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.115.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.115.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.115.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.115.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.115.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.116.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.116.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.116.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.116.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.116.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.116.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.117.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.117.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.117.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.117.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.117.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.117.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.118.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.118.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.118.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.118.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.118.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.118.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.119.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.119.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.119.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.119.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.119.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.119.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.12.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.12.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.12.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.12.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.12.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.12.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.120.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.120.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.120.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.120.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.120.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.120.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.121.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.121.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.121.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.121.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.121.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.121.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.122.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.122.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.122.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.122.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.122.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.122.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.123.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.123.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.123.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.123.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.123.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.123.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.124.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.124.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.124.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.124.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.124.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.124.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.125.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.125.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.125.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.125.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.125.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.125.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.126.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.126.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.126.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.126.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.126.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.126.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.127.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.127.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.127.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.127.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.127.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.127.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.128.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.128.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.128.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.128.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.128.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.128.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.129.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.129.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.129.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.129.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.129.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.129.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.13.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.13.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.13.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.13.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.13.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.13.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.130.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.130.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.130.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.130.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.130.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.130.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.131.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.131.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.131.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.131.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.131.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.131.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.132.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.132.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.132.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.132.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.132.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.132.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.133.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.133.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.133.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.133.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.133.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.133.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.134.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.134.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.134.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.134.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.134.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.134.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.135.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.135.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.135.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.135.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.135.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.135.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.136.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.136.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.136.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.136.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.136.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.136.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.137.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.137.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.137.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.137.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.137.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.137.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.138.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.138.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.138.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.138.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.138.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.138.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.139.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.139.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.139.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.139.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.139.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.139.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.14.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.14.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.14.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.14.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.14.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.14.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.140.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.140.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.140.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.140.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.140.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.140.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.141.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.141.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.141.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.141.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.141.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.141.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.142.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.142.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.142.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.142.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.142.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.142.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.143.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.143.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.143.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.143.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.143.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.143.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.144.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.144.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.144.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.144.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.144.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.144.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.145.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.145.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.145.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.145.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.145.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.145.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.146.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.146.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.146.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.146.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.146.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.146.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.147.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.147.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.147.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.147.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.147.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.147.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.148.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.148.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.148.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.148.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.148.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.148.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.149.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.149.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.149.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.149.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.149.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.149.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.15.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.15.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.15.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.15.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.15.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.15.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.150.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.150.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.150.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.150.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.150.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.150.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.151.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.151.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.151.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.151.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.151.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.151.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.152.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.152.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.152.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.152.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.152.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.152.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.153.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.153.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.153.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.153.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.153.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.153.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.154.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.154.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.154.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.154.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.154.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.154.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.155.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.155.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.155.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.155.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.155.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.155.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.156.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.156.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.156.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.156.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.156.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.156.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.157.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.157.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.157.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.157.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.157.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.157.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.158.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.158.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.158.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.158.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.158.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.158.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.159.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.159.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.159.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.159.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.159.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.159.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.16.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.16.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.16.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.16.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.16.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.16.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.17.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.17.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.17.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.17.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.17.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.17.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.18.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.18.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.18.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.18.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.18.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.18.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.19.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.19.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.19.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.19.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.19.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.19.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.2.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.2.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.2.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.2.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.2.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.2.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.20.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.20.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.20.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.20.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.20.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.20.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.21.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.21.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.21.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.21.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.21.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.21.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.22.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.22.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.22.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.22.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.22.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.22.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.23.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.23.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.23.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.23.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.23.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.23.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.24.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.24.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.24.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.24.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.24.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.24.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.25.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.25.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.25.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.25.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.25.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.25.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.26.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.26.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.26.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.26.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.26.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.26.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.27.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.27.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.27.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.27.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.27.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.27.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.28.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.28.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.28.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.28.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.28.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.28.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.29.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.29.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.29.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.29.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.29.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.29.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.3.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.3.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.3.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.3.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.3.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.3.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.30.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.30.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.30.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.30.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.30.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.30.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.31.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.31.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.31.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.31.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.31.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.31.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.32.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.32.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.32.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.32.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.32.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.32.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.33.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.33.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.33.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.33.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.33.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.33.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.34.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.34.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.34.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.34.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.34.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.34.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.35.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.35.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.35.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.35.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.35.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.35.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.36.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.36.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.36.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.36.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.36.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.36.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.37.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.37.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.37.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.37.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.37.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.37.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.38.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.38.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.38.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.38.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.38.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.38.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.39.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.39.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.39.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.39.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.39.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.39.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.4.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.4.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.4.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.4.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.4.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.4.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.40.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.40.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.40.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.40.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.40.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.40.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.41.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.41.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.41.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.41.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.41.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.41.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.42.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.42.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.42.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.42.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.42.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.42.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.43.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.43.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.43.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.43.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.43.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.43.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.44.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.44.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.44.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.44.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.44.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.44.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.45.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.45.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.45.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.45.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.45.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.45.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.46.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.46.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.46.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.46.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.46.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.46.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.47.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.47.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.47.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.47.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.47.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.47.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.48.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.48.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.48.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.48.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.48.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.48.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.49.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.49.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.49.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.49.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.49.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.49.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.5.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.5.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.5.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.5.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.5.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.5.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.50.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.50.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.50.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.50.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.50.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.50.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.51.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.51.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.51.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.51.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.51.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.51.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.52.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.52.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.52.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.52.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.52.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.52.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.53.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.53.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.53.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.53.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.53.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.53.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.54.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.54.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.54.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.54.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.54.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.54.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.55.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.55.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.55.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.55.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.55.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.55.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.56.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.56.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.56.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.56.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.56.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.56.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.57.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.57.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.57.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.57.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.57.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.57.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.58.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.58.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.58.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.58.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.58.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.58.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.59.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.59.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.59.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.59.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.59.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.59.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.6.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.6.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.6.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.6.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.6.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.6.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.60.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.60.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.60.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.60.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.60.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.60.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.61.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.61.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.61.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.61.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.61.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.61.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.62.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.62.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.62.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.62.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.62.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.62.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.63.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.63.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.63.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.63.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.63.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.63.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.64.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.64.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.64.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.64.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.64.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.64.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.65.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.65.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.65.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.65.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.65.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.65.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.66.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.66.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.66.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.66.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.66.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.66.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.67.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.67.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.67.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.67.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.67.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.67.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.68.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.68.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.68.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.68.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.68.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.68.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.69.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.69.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.69.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.69.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.69.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.69.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.7.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.7.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.7.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.7.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.7.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.7.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.70.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.70.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.70.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.70.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.70.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.70.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.71.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.71.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.71.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.71.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.71.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.71.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.72.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.72.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.72.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.72.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.72.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.72.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.73.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.73.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.73.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.73.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.73.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.73.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.74.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.74.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.74.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.74.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.74.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.74.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.75.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.75.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.75.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.75.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.75.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.75.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.76.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.76.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.76.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.76.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.76.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.76.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.77.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.77.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.77.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.77.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.77.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.77.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.78.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.78.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.78.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.78.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.78.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.78.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.79.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.79.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.79.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.79.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.79.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.79.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.8.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.8.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.8.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.8.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.8.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.8.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.80.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.80.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.80.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.80.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.80.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.80.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.81.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.81.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.81.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.81.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.81.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.81.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.82.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.82.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.82.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.82.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.82.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.82.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.83.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.83.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.83.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.83.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.83.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.83.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.84.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.84.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.84.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.84.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.84.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.84.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.85.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.85.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.85.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.85.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.85.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.85.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.86.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.86.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.86.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.86.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.86.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.86.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.87.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.87.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.87.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.87.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.87.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.87.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.88.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.88.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.88.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.88.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.88.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.88.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.89.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.89.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.89.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.89.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.89.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.89.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.9.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.9.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.9.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.9.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.9.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.9.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.90.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.90.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.90.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.90.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.90.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.90.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.91.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.91.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.91.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.91.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.91.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.91.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.92.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.92.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.92.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.92.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.92.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.92.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.93.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.93.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.93.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.93.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.93.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.93.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.94.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.94.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.94.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.94.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.94.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.94.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.95.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.95.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.95.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.95.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.95.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.95.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.96.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.96.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.96.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.96.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.96.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.96.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.97.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.97.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.97.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.97.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.97.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.97.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.98.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.98.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.98.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.98.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.98.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.98.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.99.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.99.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.99.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.99.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.99.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.experts.99.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.gate.e_score_correction_bias": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.gate.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.shared_experts.down_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.shared_experts.down_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.shared_experts.gate_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.shared_experts.gate_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.shared_experts.up_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.mlp.shared_experts.up_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.post_attention_layernorm.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.self_attn.k_norm.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.self_attn.k_proj.bias": "model-00042-of-00092.safetensors",
+ "model.layers.41.self_attn.k_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.self_attn.k_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.self_attn.o_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.self_attn.o_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.self_attn.q_norm.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.self_attn.q_proj.bias": "model-00042-of-00092.safetensors",
+ "model.layers.41.self_attn.q_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.self_attn.q_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.41.self_attn.v_proj.bias": "model-00042-of-00092.safetensors",
+ "model.layers.41.self_attn.v_proj.weight": "model-00042-of-00092.safetensors",
+ "model.layers.41.self_attn.v_proj.weight_scale": "model-00042-of-00092.safetensors",
+ "model.layers.42.input_layernorm.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.0.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.0.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.0.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.0.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.0.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.0.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.1.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.1.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.1.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.1.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.1.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.1.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.10.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.10.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.10.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.10.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.10.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.10.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.100.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.100.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.100.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.100.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.100.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.100.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.101.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.101.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.101.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.101.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.101.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.101.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.102.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.102.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.102.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.102.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.102.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.102.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.103.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.103.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.103.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.103.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.103.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.103.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.104.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.104.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.104.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.104.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.104.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.104.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.105.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.105.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.105.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.105.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.105.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.105.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.106.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.106.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.106.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.106.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.106.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.106.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.107.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.107.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.107.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.107.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.107.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.107.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.108.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.108.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.108.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.108.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.108.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.108.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.109.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.109.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.109.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.109.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.109.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.109.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.11.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.11.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.11.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.11.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.11.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.11.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.110.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.110.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.110.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.110.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.110.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.110.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.111.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.111.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.111.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.111.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.111.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.111.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.112.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.112.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.112.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.112.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.112.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.112.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.113.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.113.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.113.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.113.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.113.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.113.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.114.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.114.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.114.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.114.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.114.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.114.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.115.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.115.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.115.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.115.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.115.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.115.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.116.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.116.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.116.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.116.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.116.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.116.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.117.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.117.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.117.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.117.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.117.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.117.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.118.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.118.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.118.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.118.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.118.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.118.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.119.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.119.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.119.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.119.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.119.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.119.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.12.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.12.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.12.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.12.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.12.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.12.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.120.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.120.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.120.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.120.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.120.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.120.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.121.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.121.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.121.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.121.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.121.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.121.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.122.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.122.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.122.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.122.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.122.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.122.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.123.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.123.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.123.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.123.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.123.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.123.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.124.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.124.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.124.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.124.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.124.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.124.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.125.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.125.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.125.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.125.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.125.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.125.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.126.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.126.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.126.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.126.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.126.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.126.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.127.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.127.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.127.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.127.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.127.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.127.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.128.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.128.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.128.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.128.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.128.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.128.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.129.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.129.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.129.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.129.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.129.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.129.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.13.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.13.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.13.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.13.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.13.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.13.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.130.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.130.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.130.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.130.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.130.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.130.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.131.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.131.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.131.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.131.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.131.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.131.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.132.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.132.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.132.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.132.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.132.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.132.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.133.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.133.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.133.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.133.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.133.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.133.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.134.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.134.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.134.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.134.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.134.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.134.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.135.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.135.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.135.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.135.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.135.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.135.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.136.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.136.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.136.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.136.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.136.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.136.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.137.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.137.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.137.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.137.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.137.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.137.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.138.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.138.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.138.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.138.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.138.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.138.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.139.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.139.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.139.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.139.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.139.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.139.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.14.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.14.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.14.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.14.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.14.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.14.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.140.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.140.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.140.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.140.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.140.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.140.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.141.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.141.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.141.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.141.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.141.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.141.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.142.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.142.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.142.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.142.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.142.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.142.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.143.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.143.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.143.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.143.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.143.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.143.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.144.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.144.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.144.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.144.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.144.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.144.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.145.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.145.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.145.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.145.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.145.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.145.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.146.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.146.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.146.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.146.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.146.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.146.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.147.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.147.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.147.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.147.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.147.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.147.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.148.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.148.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.148.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.148.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.148.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.148.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.149.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.149.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.149.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.149.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.149.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.149.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.15.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.15.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.15.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.15.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.15.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.15.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.150.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.150.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.150.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.150.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.150.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.150.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.151.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.151.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.151.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.151.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.151.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.151.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.152.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.152.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.152.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.152.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.152.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.152.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.153.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.153.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.153.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.153.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.153.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.153.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.154.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.154.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.154.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.154.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.154.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.154.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.155.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.155.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.155.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.155.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.155.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.155.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.156.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.156.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.156.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.156.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.156.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.156.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.157.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.157.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.157.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.157.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.157.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.157.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.158.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.158.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.158.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.158.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.158.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.158.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.159.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.159.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.159.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.159.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.159.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.159.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.16.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.16.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.16.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.16.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.16.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.16.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.17.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.17.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.17.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.17.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.17.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.17.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.18.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.18.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.18.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.18.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.18.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.18.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.19.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.19.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.19.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.19.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.19.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.19.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.2.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.2.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.2.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.2.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.2.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.2.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.20.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.20.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.20.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.20.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.20.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.20.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.21.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.21.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.21.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.21.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.21.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.21.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.22.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.22.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.22.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.22.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.22.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.22.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.23.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.23.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.23.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.23.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.23.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.23.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.24.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.24.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.24.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.24.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.24.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.24.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.25.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.25.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.25.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.25.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.25.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.25.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.26.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.26.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.26.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.26.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.26.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.26.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.27.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.27.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.27.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.27.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.27.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.27.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.28.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.28.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.28.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.28.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.28.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.28.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.29.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.29.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.29.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.29.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.29.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.29.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.3.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.3.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.3.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.3.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.3.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.3.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.30.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.30.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.30.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.30.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.30.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.30.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.31.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.31.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.31.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.31.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.31.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.31.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.32.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.32.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.32.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.32.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.32.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.32.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.33.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.33.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.33.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.33.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.33.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.33.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.34.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.34.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.34.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.34.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.34.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.34.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.35.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.35.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.35.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.35.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.35.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.35.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.36.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.36.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.36.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.36.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.36.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.36.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.37.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.37.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.37.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.37.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.37.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.37.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.38.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.38.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.38.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.38.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.38.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.38.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.39.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.39.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.39.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.39.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.39.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.39.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.4.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.4.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.4.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.4.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.4.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.4.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.40.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.40.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.40.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.40.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.40.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.40.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.41.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.41.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.41.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.41.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.41.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.41.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.42.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.42.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.42.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.42.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.42.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.42.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.43.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.43.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.43.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.43.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.43.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.43.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.44.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.44.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.44.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.44.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.44.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.44.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.45.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.45.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.45.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.45.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.45.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.45.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.46.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.46.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.46.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.46.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.46.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.46.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.47.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.47.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.47.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.47.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.47.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.47.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.48.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.48.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.48.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.48.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.48.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.48.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.49.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.49.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.49.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.49.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.49.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.49.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.5.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.5.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.5.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.5.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.5.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.5.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.50.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.50.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.50.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.50.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.50.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.50.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.51.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.51.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.51.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.51.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.51.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.51.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.52.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.52.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.52.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.52.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.52.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.52.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.53.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.53.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.53.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.53.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.53.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.53.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.54.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.54.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.54.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.54.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.54.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.54.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.55.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.55.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.55.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.55.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.55.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.55.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.56.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.56.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.56.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.56.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.56.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.56.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.57.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.57.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.57.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.57.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.57.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.57.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.58.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.58.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.58.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.58.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.58.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.58.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.59.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.59.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.59.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.59.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.59.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.59.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.6.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.6.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.6.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.6.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.6.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.6.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.60.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.60.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.60.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.60.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.60.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.60.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.61.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.61.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.61.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.61.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.61.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.61.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.62.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.62.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.62.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.62.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.62.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.62.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.63.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.63.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.63.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.63.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.63.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.63.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.64.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.64.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.64.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.64.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.64.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.64.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.65.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.65.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.65.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.65.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.65.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.65.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.66.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.66.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.66.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.66.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.66.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.66.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.67.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.67.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.67.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.67.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.67.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.67.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.68.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.68.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.68.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.68.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.68.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.68.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.69.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.69.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.69.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.69.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.69.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.69.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.7.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.7.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.7.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.7.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.7.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.7.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.70.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.70.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.70.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.70.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.70.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.70.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.71.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.71.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.71.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.71.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.71.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.71.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.72.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.72.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.72.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.72.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.72.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.72.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.73.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.73.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.73.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.73.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.73.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.73.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.74.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.74.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.74.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.74.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.74.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.74.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.75.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.75.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.75.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.75.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.75.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.75.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.76.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.76.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.76.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.76.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.76.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.76.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.77.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.77.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.77.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.77.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.77.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.77.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.78.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.78.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.78.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.78.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.78.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.78.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.79.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.79.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.79.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.79.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.79.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.79.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.8.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.8.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.8.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.8.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.8.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.8.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.80.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.80.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.80.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.80.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.80.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.80.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.81.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.81.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.81.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.81.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.81.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.81.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.82.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.82.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.82.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.82.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.82.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.82.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.83.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.83.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.83.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.83.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.83.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.83.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.84.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.84.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.84.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.84.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.84.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.84.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.85.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.85.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.85.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.85.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.85.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.85.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.86.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.86.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.86.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.86.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.86.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.86.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.87.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.87.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.87.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.87.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.87.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.87.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.88.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.88.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.88.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.88.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.88.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.88.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.89.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.89.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.89.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.89.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.89.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.89.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.9.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.9.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.9.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.9.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.9.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.9.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.90.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.90.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.90.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.90.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.90.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.90.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.91.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.91.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.91.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.91.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.91.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.91.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.92.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.92.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.92.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.92.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.92.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.92.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.93.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.93.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.93.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.93.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.93.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.93.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.94.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.94.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.94.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.94.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.94.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.94.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.95.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.95.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.95.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.95.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.95.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.95.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.96.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.96.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.96.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.96.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.96.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.96.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.97.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.97.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.97.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.97.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.97.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.97.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.98.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.98.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.98.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.98.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.98.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.98.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.99.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.99.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.99.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.99.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.99.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.experts.99.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.gate.e_score_correction_bias": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.gate.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.shared_experts.down_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.shared_experts.down_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.shared_experts.gate_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.shared_experts.gate_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.shared_experts.up_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.mlp.shared_experts.up_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.post_attention_layernorm.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.self_attn.k_norm.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.self_attn.k_proj.bias": "model-00043-of-00092.safetensors",
+ "model.layers.42.self_attn.k_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.self_attn.k_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.self_attn.o_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.self_attn.o_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.self_attn.q_norm.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.self_attn.q_proj.bias": "model-00043-of-00092.safetensors",
+ "model.layers.42.self_attn.q_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.self_attn.q_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.42.self_attn.v_proj.bias": "model-00043-of-00092.safetensors",
+ "model.layers.42.self_attn.v_proj.weight": "model-00043-of-00092.safetensors",
+ "model.layers.42.self_attn.v_proj.weight_scale": "model-00043-of-00092.safetensors",
+ "model.layers.43.input_layernorm.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.0.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.0.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.0.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.0.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.0.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.0.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.1.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.1.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.1.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.1.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.1.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.1.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.10.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.10.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.10.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.10.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.10.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.10.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.100.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.100.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.100.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.100.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.100.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.100.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.101.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.101.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.101.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.101.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.101.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.101.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.102.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.102.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.102.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.102.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.102.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.102.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.103.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.103.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.103.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.103.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.103.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.103.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.104.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.104.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.104.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.104.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.104.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.104.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.105.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.105.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.105.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.105.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.105.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.105.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.106.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.106.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.106.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.106.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.106.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.106.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.107.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.107.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.107.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.107.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.107.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.107.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.108.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.108.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.108.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.108.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.108.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.108.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.109.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.109.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.109.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.109.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.109.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.109.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.11.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.11.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.11.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.11.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.11.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.11.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.110.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.110.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.110.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.110.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.110.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.110.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.111.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.111.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.111.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.111.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.111.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.111.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.112.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.112.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.112.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.112.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.112.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.112.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.113.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.113.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.113.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.113.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.113.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.113.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.114.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.114.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.114.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.114.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.114.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.114.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.115.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.115.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.115.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.115.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.115.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.115.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.116.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.116.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.116.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.116.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.116.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.116.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.117.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.117.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.117.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.117.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.117.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.117.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.118.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.118.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.118.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.118.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.118.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.118.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.119.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.119.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.119.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.119.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.119.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.119.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.12.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.12.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.12.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.12.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.12.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.12.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.120.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.120.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.120.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.120.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.120.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.120.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.121.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.121.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.121.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.121.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.121.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.121.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.122.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.122.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.122.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.122.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.122.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.122.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.123.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.123.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.123.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.123.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.123.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.123.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.124.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.124.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.124.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.124.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.124.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.124.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.125.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.125.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.125.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.125.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.125.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.125.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.126.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.126.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.126.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.126.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.126.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.126.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.127.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.127.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.127.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.127.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.127.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.127.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.128.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.128.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.128.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.128.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.128.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.128.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.129.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.129.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.129.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.129.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.129.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.129.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.13.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.13.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.13.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.13.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.13.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.13.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.130.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.130.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.130.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.130.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.130.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.130.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.131.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.131.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.131.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.131.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.131.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.131.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.132.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.132.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.132.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.132.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.132.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.132.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.133.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.133.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.133.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.133.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.133.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.133.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.134.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.134.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.134.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.134.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.134.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.134.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.135.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.135.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.135.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.135.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.135.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.135.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.136.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.136.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.136.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.136.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.136.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.136.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.137.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.137.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.137.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.137.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.137.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.137.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.138.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.138.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.138.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.138.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.138.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.138.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.139.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.139.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.139.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.139.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.139.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.139.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.14.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.14.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.14.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.14.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.14.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.14.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.140.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.140.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.140.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.140.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.140.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.140.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.141.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.141.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.141.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.141.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.141.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.141.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.142.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.142.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.142.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.142.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.142.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.142.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.143.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.143.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.143.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.143.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.143.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.143.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.144.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.144.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.144.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.144.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.144.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.144.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.145.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.145.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.145.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.145.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.145.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.145.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.146.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.146.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.146.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.146.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.146.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.146.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.147.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.147.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.147.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.147.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.147.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.147.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.148.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.148.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.148.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.148.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.148.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.148.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.149.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.149.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.149.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.149.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.149.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.149.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.15.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.15.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.15.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.15.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.15.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.15.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.150.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.150.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.150.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.150.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.150.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.150.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.151.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.151.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.151.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.151.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.151.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.151.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.152.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.152.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.152.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.152.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.152.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.152.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.153.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.153.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.153.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.153.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.153.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.153.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.154.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.154.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.154.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.154.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.154.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.154.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.155.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.155.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.155.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.155.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.155.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.155.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.156.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.156.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.156.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.156.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.156.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.156.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.157.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.157.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.157.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.157.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.157.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.157.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.158.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.158.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.158.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.158.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.158.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.158.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.159.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.159.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.159.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.159.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.159.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.159.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.16.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.16.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.16.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.16.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.16.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.16.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.17.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.17.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.17.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.17.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.17.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.17.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.18.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.18.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.18.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.18.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.18.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.18.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.19.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.19.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.19.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.19.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.19.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.19.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.2.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.2.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.2.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.2.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.2.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.2.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.20.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.20.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.20.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.20.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.20.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.20.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.21.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.21.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.21.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.21.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.21.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.21.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.22.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.22.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.22.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.22.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.22.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.22.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.23.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.23.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.23.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.23.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.23.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.23.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.24.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.24.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.24.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.24.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.24.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.24.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.25.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.25.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.25.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.25.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.25.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.25.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.26.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.26.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.26.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.26.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.26.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.26.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.27.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.27.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.27.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.27.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.27.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.27.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.28.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.28.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.28.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.28.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.28.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.28.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.29.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.29.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.29.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.29.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.29.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.29.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.3.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.3.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.3.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.3.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.3.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.3.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.30.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.30.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.30.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.30.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.30.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.30.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.31.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.31.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.31.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.31.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.31.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.31.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.32.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.32.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.32.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.32.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.32.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.32.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.33.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.33.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.33.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.33.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.33.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.33.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.34.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.34.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.34.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.34.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.34.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.34.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.35.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.35.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.35.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.35.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.35.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.35.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.36.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.36.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.36.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.36.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.36.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.36.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.37.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.37.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.37.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.37.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.37.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.37.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.38.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.38.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.38.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.38.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.38.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.38.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.39.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.39.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.39.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.39.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.39.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.39.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.4.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.4.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.4.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.4.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.4.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.4.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.40.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.40.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.40.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.40.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.40.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.40.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.41.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.41.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.41.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.41.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.41.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.41.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.42.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.42.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.42.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.42.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.42.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.42.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.43.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.43.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.43.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.43.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.43.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.43.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.44.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.44.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.44.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.44.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.44.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.44.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.45.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.45.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.45.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.45.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.45.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.45.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.46.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.46.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.46.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.46.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.46.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.46.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.47.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.47.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.47.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.47.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.47.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.47.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.48.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.48.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.48.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.48.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.48.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.48.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.49.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.49.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.49.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.49.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.49.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.49.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.5.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.5.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.5.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.5.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.5.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.5.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.50.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.50.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.50.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.50.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.50.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.50.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.51.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.51.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.51.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.51.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.51.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.51.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.52.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.52.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.52.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.52.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.52.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.52.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.53.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.53.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.53.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.53.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.53.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.53.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.54.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.54.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.54.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.54.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.54.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.54.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.55.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.55.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.55.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.55.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.55.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.55.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.56.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.56.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.56.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.56.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.56.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.56.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.57.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.57.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.57.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.57.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.57.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.57.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.58.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.58.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.58.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.58.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.58.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.58.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.59.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.59.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.59.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.59.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.59.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.59.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.6.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.6.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.6.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.6.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.6.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.6.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.60.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.60.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.60.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.60.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.60.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.60.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.61.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.61.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.61.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.61.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.61.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.61.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.62.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.62.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.62.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.62.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.62.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.62.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.63.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.63.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.63.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.63.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.63.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.63.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.64.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.64.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.64.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.64.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.64.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.64.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.65.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.65.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.65.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.65.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.65.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.65.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.66.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.66.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.66.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.66.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.66.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.66.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.67.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.67.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.67.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.67.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.67.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.67.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.68.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.68.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.68.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.68.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.68.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.68.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.69.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.69.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.69.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.69.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.69.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.69.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.7.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.7.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.7.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.7.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.7.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.7.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.70.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.70.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.70.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.70.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.70.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.70.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.71.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.71.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.71.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.71.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.71.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.71.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.72.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.72.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.72.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.72.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.72.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.72.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.73.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.73.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.73.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.73.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.73.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.73.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.74.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.74.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.74.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.74.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.74.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.74.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.75.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.75.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.75.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.75.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.75.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.75.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.76.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.76.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.76.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.76.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.76.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.76.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.77.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.77.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.77.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.77.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.77.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.77.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.78.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.78.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.78.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.78.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.78.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.78.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.79.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.79.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.79.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.79.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.79.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.79.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.8.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.8.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.8.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.8.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.8.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.8.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.80.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.80.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.80.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.80.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.80.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.80.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.81.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.81.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.81.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.81.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.81.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.81.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.82.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.82.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.82.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.82.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.82.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.82.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.83.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.83.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.83.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.83.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.83.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.83.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.84.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.84.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.84.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.84.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.84.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.84.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.85.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.85.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.85.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.85.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.85.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.85.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.86.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.86.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.86.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.86.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.86.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.86.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.87.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.87.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.87.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.87.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.87.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.87.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.88.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.88.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.88.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.88.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.88.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.88.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.89.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.89.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.89.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.89.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.89.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.89.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.9.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.9.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.9.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.9.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.9.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.9.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.90.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.90.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.90.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.90.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.90.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.90.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.91.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.91.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.91.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.91.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.91.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.91.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.92.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.92.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.92.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.92.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.92.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.92.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.93.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.93.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.93.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.93.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.93.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.93.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.94.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.94.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.94.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.94.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.94.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.94.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.95.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.95.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.95.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.95.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.95.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.95.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.96.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.96.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.96.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.96.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.96.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.96.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.97.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.97.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.97.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.97.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.97.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.97.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.98.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.98.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.98.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.98.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.98.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.98.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.99.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.99.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.99.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.99.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.99.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.experts.99.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.gate.e_score_correction_bias": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.gate.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.shared_experts.down_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.shared_experts.down_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.shared_experts.gate_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.shared_experts.gate_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.shared_experts.up_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.mlp.shared_experts.up_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.post_attention_layernorm.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.self_attn.k_norm.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.self_attn.k_proj.bias": "model-00044-of-00092.safetensors",
+ "model.layers.43.self_attn.k_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.self_attn.k_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.self_attn.o_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.self_attn.o_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.self_attn.q_norm.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.self_attn.q_proj.bias": "model-00044-of-00092.safetensors",
+ "model.layers.43.self_attn.q_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.self_attn.q_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.43.self_attn.v_proj.bias": "model-00044-of-00092.safetensors",
+ "model.layers.43.self_attn.v_proj.weight": "model-00044-of-00092.safetensors",
+ "model.layers.43.self_attn.v_proj.weight_scale": "model-00044-of-00092.safetensors",
+ "model.layers.44.input_layernorm.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.0.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.0.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.0.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.0.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.0.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.0.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.1.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.1.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.1.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.1.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.1.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.1.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.10.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.10.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.10.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.10.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.10.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.10.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.100.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.100.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.100.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.100.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.100.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.100.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.101.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.101.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.101.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.101.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.101.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.101.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.102.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.102.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.102.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.102.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.102.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.102.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.103.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.103.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.103.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.103.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.103.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.103.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.104.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.104.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.104.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.104.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.104.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.104.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.105.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.105.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.105.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.105.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.105.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.105.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.106.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.106.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.106.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.106.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.106.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.106.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.107.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.107.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.107.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.107.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.107.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.107.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.108.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.108.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.108.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.108.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.108.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.108.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.109.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.109.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.109.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.109.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.109.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.109.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.11.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.11.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.11.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.11.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.11.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.11.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.110.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.110.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.110.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.110.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.110.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.110.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.111.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.111.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.111.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.111.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.111.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.111.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.112.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.112.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.112.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.112.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.112.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.112.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.113.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.113.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.113.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.113.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.113.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.113.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.114.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.114.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.114.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.114.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.114.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.114.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.115.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.115.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.115.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.115.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.115.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.115.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.116.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.116.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.116.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.116.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.116.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.116.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.117.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.117.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.117.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.117.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.117.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.117.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.118.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.118.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.118.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.118.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.118.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.118.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.119.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.119.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.119.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.119.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.119.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.119.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.12.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.12.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.12.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.12.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.12.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.12.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.120.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.120.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.120.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.120.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.120.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.120.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.121.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.121.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.121.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.121.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.121.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.121.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.122.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.122.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.122.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.122.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.122.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.122.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.123.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.123.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.123.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.123.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.123.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.123.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.124.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.124.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.124.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.124.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.124.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.124.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.125.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.125.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.125.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.125.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.125.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.125.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.126.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.126.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.126.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.126.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.126.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.126.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.127.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.127.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.127.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.127.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.127.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.127.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.128.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.128.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.128.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.128.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.128.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.128.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.129.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.129.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.129.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.129.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.129.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.129.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.13.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.13.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.13.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.13.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.13.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.13.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.130.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.130.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.130.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.130.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.130.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.130.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.131.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.131.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.131.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.131.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.131.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.131.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.132.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.132.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.132.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.132.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.132.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.132.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.133.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.133.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.133.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.133.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.133.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.133.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.134.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.134.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.134.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.134.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.134.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.134.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.135.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.135.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.135.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.135.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.135.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.135.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.136.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.136.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.136.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.136.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.136.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.136.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.137.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.137.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.137.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.137.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.137.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.137.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.138.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.138.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.138.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.138.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.138.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.138.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.139.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.139.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.139.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.139.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.139.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.139.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.14.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.14.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.14.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.14.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.14.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.14.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.140.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.140.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.140.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.140.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.140.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.140.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.141.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.141.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.141.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.141.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.141.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.141.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.142.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.142.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.142.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.142.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.142.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.142.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.143.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.143.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.143.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.143.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.143.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.143.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.144.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.144.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.144.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.144.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.144.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.144.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.145.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.145.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.145.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.145.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.145.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.145.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.146.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.146.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.146.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.146.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.146.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.146.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.147.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.147.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.147.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.147.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.147.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.147.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.148.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.148.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.148.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.148.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.148.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.148.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.149.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.149.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.149.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.149.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.149.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.149.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.15.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.15.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.15.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.15.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.15.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.15.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.150.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.150.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.150.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.150.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.150.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.150.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.151.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.151.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.151.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.151.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.151.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.151.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.152.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.152.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.152.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.152.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.152.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.152.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.153.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.153.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.153.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.153.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.153.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.153.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.154.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.154.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.154.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.154.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.154.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.154.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.155.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.155.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.155.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.155.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.155.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.155.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.156.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.156.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.156.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.156.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.156.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.156.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.157.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.157.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.157.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.157.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.157.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.157.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.158.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.158.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.158.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.158.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.158.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.158.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.159.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.159.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.159.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.159.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.159.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.159.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.16.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.16.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.16.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.16.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.16.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.16.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.17.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.17.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.17.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.17.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.17.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.17.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.18.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.18.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.18.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.18.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.18.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.18.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.19.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.19.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.19.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.19.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.19.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.19.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.2.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.2.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.2.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.2.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.2.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.2.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.20.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.20.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.20.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.20.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.20.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.20.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.21.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.21.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.21.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.21.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.21.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.21.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.22.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.22.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.22.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.22.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.22.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.22.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.23.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.23.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.23.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.23.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.23.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.23.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.24.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.24.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.24.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.24.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.24.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.24.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.25.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.25.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.25.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.25.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.25.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.25.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.26.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.26.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.26.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.26.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.26.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.26.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.27.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.27.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.27.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.27.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.27.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.27.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.28.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.28.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.28.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.28.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.28.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.28.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.29.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.29.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.29.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.29.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.29.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.29.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.3.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.3.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.3.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.3.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.3.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.3.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.30.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.30.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.30.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.30.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.30.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.30.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.31.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.31.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.31.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.31.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.31.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.31.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.32.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.32.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.32.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.32.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.32.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.32.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.33.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.33.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.33.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.33.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.33.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.33.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.34.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.34.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.34.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.34.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.34.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.34.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.35.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.35.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.35.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.35.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.35.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.35.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.36.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.36.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.36.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.36.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.36.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.36.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.37.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.37.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.37.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.37.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.37.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.37.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.38.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.38.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.38.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.38.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.38.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.38.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.39.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.39.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.39.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.39.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.39.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.39.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.4.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.4.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.4.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.4.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.4.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.4.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.40.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.40.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.40.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.40.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.40.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.40.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.41.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.41.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.41.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.41.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.41.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.41.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.42.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.42.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.42.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.42.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.42.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.42.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.43.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.43.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.43.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.43.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.43.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.43.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.44.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.44.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.44.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.44.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.44.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.44.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.45.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.45.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.45.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.45.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.45.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.45.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.46.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.46.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.46.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.46.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.46.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.46.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.47.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.47.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.47.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.47.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.47.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.47.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.48.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.48.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.48.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.48.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.48.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.48.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.49.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.49.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.49.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.49.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.49.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.49.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.5.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.5.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.5.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.5.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.5.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.5.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.50.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.50.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.50.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.50.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.50.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.50.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.51.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.51.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.51.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.51.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.51.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.51.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.52.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.52.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.52.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.52.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.52.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.52.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.53.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.53.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.53.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.53.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.53.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.53.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.54.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.54.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.54.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.54.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.54.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.54.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.55.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.55.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.55.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.55.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.55.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.55.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.56.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.56.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.56.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.56.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.56.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.56.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.57.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.57.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.57.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.57.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.57.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.57.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.58.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.58.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.58.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.58.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.58.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.58.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.59.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.59.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.59.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.59.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.59.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.59.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.6.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.6.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.6.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.6.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.6.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.6.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.60.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.60.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.60.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.60.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.60.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.60.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.61.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.61.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.61.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.61.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.61.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.61.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.62.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.62.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.62.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.62.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.62.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.62.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.63.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.63.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.63.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.63.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.63.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.63.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.64.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.64.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.64.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.64.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.64.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.64.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.65.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.65.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.65.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.65.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.65.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.65.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.66.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.66.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.66.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.66.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.66.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.66.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.67.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.67.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.67.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.67.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.67.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.67.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.68.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.68.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.68.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.68.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.68.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.68.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.69.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.69.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.69.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.69.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.69.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.69.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.7.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.7.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.7.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.7.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.7.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.7.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.70.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.70.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.70.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.70.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.70.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.70.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.71.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.71.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.71.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.71.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.71.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.71.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.72.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.72.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.72.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.72.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.72.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.72.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.73.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.73.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.73.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.73.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.73.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.73.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.74.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.74.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.74.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.74.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.74.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.74.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.75.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.75.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.75.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.75.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.75.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.75.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.76.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.76.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.76.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.76.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.76.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.76.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.77.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.77.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.77.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.77.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.77.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.77.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.78.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.78.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.78.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.78.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.78.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.78.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.79.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.79.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.79.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.79.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.79.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.79.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.8.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.8.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.8.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.8.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.8.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.8.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.80.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.80.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.80.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.80.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.80.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.80.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.81.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.81.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.81.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.81.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.81.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.81.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.82.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.82.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.82.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.82.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.82.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.82.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.83.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.83.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.83.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.83.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.83.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.83.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.84.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.84.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.84.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.84.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.84.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.84.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.85.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.85.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.85.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.85.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.85.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.85.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.86.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.86.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.86.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.86.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.86.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.86.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.87.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.87.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.87.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.87.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.87.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.87.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.88.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.88.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.88.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.88.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.88.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.88.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.89.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.89.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.89.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.89.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.89.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.89.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.9.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.9.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.9.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.9.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.9.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.9.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.90.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.90.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.90.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.90.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.90.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.90.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.91.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.91.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.91.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.91.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.91.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.91.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.92.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.92.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.92.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.92.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.92.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.92.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.93.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.93.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.93.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.93.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.93.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.93.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.94.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.94.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.94.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.94.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.94.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.94.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.95.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.95.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.95.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.95.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.95.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.95.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.96.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.96.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.96.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.96.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.96.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.96.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.97.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.97.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.97.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.97.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.97.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.97.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.98.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.98.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.98.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.98.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.98.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.98.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.99.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.99.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.99.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.99.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.99.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.experts.99.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.gate.e_score_correction_bias": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.gate.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.shared_experts.down_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.shared_experts.down_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.shared_experts.gate_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.shared_experts.gate_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.shared_experts.up_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.mlp.shared_experts.up_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.post_attention_layernorm.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.self_attn.k_norm.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.self_attn.k_proj.bias": "model-00045-of-00092.safetensors",
+ "model.layers.44.self_attn.k_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.self_attn.k_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.self_attn.o_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.self_attn.o_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.self_attn.q_norm.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.self_attn.q_proj.bias": "model-00045-of-00092.safetensors",
+ "model.layers.44.self_attn.q_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.self_attn.q_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.44.self_attn.v_proj.bias": "model-00045-of-00092.safetensors",
+ "model.layers.44.self_attn.v_proj.weight": "model-00045-of-00092.safetensors",
+ "model.layers.44.self_attn.v_proj.weight_scale": "model-00045-of-00092.safetensors",
+ "model.layers.45.input_layernorm.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.0.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.0.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.0.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.0.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.0.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.0.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.1.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.1.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.1.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.1.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.1.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.1.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.10.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.10.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.10.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.10.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.10.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.10.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.100.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.100.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.100.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.100.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.100.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.100.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.101.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.101.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.101.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.101.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.101.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.101.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.102.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.102.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.102.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.102.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.102.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.102.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.103.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.103.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.103.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.103.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.103.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.103.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.104.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.104.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.104.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.104.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.104.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.104.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.105.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.105.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.105.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.105.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.105.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.105.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.106.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.106.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.106.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.106.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.106.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.106.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.107.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.107.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.107.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.107.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.107.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.107.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.108.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.108.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.108.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.108.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.108.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.108.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.109.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.109.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.109.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.109.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.109.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.109.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.11.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.11.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.11.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.11.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.11.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.11.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.110.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.110.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.110.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.110.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.110.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.110.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.111.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.111.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.111.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.111.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.111.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.111.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.112.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.112.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.112.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.112.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.112.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.112.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.113.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.113.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.113.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.113.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.113.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.113.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.114.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.114.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.114.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.114.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.114.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.114.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.115.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.115.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.115.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.115.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.115.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.115.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.116.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.116.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.116.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.116.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.116.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.116.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.117.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.117.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.117.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.117.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.117.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.117.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.118.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.118.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.118.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.118.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.118.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.118.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.119.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.119.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.119.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.119.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.119.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.119.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.12.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.12.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.12.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.12.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.12.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.12.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.120.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.120.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.120.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.120.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.120.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.120.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.121.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.121.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.121.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.121.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.121.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.121.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.122.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.122.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.122.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.122.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.122.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.122.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.123.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.123.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.123.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.123.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.123.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.123.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.124.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.124.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.124.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.124.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.124.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.124.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.125.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.125.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.125.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.125.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.125.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.125.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.126.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.126.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.126.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.126.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.126.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.126.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.127.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.127.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.127.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.127.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.127.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.127.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.128.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.128.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.128.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.128.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.128.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.128.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.129.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.129.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.129.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.129.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.129.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.129.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.13.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.13.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.13.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.13.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.13.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.13.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.130.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.130.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.130.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.130.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.130.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.130.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.131.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.131.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.131.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.131.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.131.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.131.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.132.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.132.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.132.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.132.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.132.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.132.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.133.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.133.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.133.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.133.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.133.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.133.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.134.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.134.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.134.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.134.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.134.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.134.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.135.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.135.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.135.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.135.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.135.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.135.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.136.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.136.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.136.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.136.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.136.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.136.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.137.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.137.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.137.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.137.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.137.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.137.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.138.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.138.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.138.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.138.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.138.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.138.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.139.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.139.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.139.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.139.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.139.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.139.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.14.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.14.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.14.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.14.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.14.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.14.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.140.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.140.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.140.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.140.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.140.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.140.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.141.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.141.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.141.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.141.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.141.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.141.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.142.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.142.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.142.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.142.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.142.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.142.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.143.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.143.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.143.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.143.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.143.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.143.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.144.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.144.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.144.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.144.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.144.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.144.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.145.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.145.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.145.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.145.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.145.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.145.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.146.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.146.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.146.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.146.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.146.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.146.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.147.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.147.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.147.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.147.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.147.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.147.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.148.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.148.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.148.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.148.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.148.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.148.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.149.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.149.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.149.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.149.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.149.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.149.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.15.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.15.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.15.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.15.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.15.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.15.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.150.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.150.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.150.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.150.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.150.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.150.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.151.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.151.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.151.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.151.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.151.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.151.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.152.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.152.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.152.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.152.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.152.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.152.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.153.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.153.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.153.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.153.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.153.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.153.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.154.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.154.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.154.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.154.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.154.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.154.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.155.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.155.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.155.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.155.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.155.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.155.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.156.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.156.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.156.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.156.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.156.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.156.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.157.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.157.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.157.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.157.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.157.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.157.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.158.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.158.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.158.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.158.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.158.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.158.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.159.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.159.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.159.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.159.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.159.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.159.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.16.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.16.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.16.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.16.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.16.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.16.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.17.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.17.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.17.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.17.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.17.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.17.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.18.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.18.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.18.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.18.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.18.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.18.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.19.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.19.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.19.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.19.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.19.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.19.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.2.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.2.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.2.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.2.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.2.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.2.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.20.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.20.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.20.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.20.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.20.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.20.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.21.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.21.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.21.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.21.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.21.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.21.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.22.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.22.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.22.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.22.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.22.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.22.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.23.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.23.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.23.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.23.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.23.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.23.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.24.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.24.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.24.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.24.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.24.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.24.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.25.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.25.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.25.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.25.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.25.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.25.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.26.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.26.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.26.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.26.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.26.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.26.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.27.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.27.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.27.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.27.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.27.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.27.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.28.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.28.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.28.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.28.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.28.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.28.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.29.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.29.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.29.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.29.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.29.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.29.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.3.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.3.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.3.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.3.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.3.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.3.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.30.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.30.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.30.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.30.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.30.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.30.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.31.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.31.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.31.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.31.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.31.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.31.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.32.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.32.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.32.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.32.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.32.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.32.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.33.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.33.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.33.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.33.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.33.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.33.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.34.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.34.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.34.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.34.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.34.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.34.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.35.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.35.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.35.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.35.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.35.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.35.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.36.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.36.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.36.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.36.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.36.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.36.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.37.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.37.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.37.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.37.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.37.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.37.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.38.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.38.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.38.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.38.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.38.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.38.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.39.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.39.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.39.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.39.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.39.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.39.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.4.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.4.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.4.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.4.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.4.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.4.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.40.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.40.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.40.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.40.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.40.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.40.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.41.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.41.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.41.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.41.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.41.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.41.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.42.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.42.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.42.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.42.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.42.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.42.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.43.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.43.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.43.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.43.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.43.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.43.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.44.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.44.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.44.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.44.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.44.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.44.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.45.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.45.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.45.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.45.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.45.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.45.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.46.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.46.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.46.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.46.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.46.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.46.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.47.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.47.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.47.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.47.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.47.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.47.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.48.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.48.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.48.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.48.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.48.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.48.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.49.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.49.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.49.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.49.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.49.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.49.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.5.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.5.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.5.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.5.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.5.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.5.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.50.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.50.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.50.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.50.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.50.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.50.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.51.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.51.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.51.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.51.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.51.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.51.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.52.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.52.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.52.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.52.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.52.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.52.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.53.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.53.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.53.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.53.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.53.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.53.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.54.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.54.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.54.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.54.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.54.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.54.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.55.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.55.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.55.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.55.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.55.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.55.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.56.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.56.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.56.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.56.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.56.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.56.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.57.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.57.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.57.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.57.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.57.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.57.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.58.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.58.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.58.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.58.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.58.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.58.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.59.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.59.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.59.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.59.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.59.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.59.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.6.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.6.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.6.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.6.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.6.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.6.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.60.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.60.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.60.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.60.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.60.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.60.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.61.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.61.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.61.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.61.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.61.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.61.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.62.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.62.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.62.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.62.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.62.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.62.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.63.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.63.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.63.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.63.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.63.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.63.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.64.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.64.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.64.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.64.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.64.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.64.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.65.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.65.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.65.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.65.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.65.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.65.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.66.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.66.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.66.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.66.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.66.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.66.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.67.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.67.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.67.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.67.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.67.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.67.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.68.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.68.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.68.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.68.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.68.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.68.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.69.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.69.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.69.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.69.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.69.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.69.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.7.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.7.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.7.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.7.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.7.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.7.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.70.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.70.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.70.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.70.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.70.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.70.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.71.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.71.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.71.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.71.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.71.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.71.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.72.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.72.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.72.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.72.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.72.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.72.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.73.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.73.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.73.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.73.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.73.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.73.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.74.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.74.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.74.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.74.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.74.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.74.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.75.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.75.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.75.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.75.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.75.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.75.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.76.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.76.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.76.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.76.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.76.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.76.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.77.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.77.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.77.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.77.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.77.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.77.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.78.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.78.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.78.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.78.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.78.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.78.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.79.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.79.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.79.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.79.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.79.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.79.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.8.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.8.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.8.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.8.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.8.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.8.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.80.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.80.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.80.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.80.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.80.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.80.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.81.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.81.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.81.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.81.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.81.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.81.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.82.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.82.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.82.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.82.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.82.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.82.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.83.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.83.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.83.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.83.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.83.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.83.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.84.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.84.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.84.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.84.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.84.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.84.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.85.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.85.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.85.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.85.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.85.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.85.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.86.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.86.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.86.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.86.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.86.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.86.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.87.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.87.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.87.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.87.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.87.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.87.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.88.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.88.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.88.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.88.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.88.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.88.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.89.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.89.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.89.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.89.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.89.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.89.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.9.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.9.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.9.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.9.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.9.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.9.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.90.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.90.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.90.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.90.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.90.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.90.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.91.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.91.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.91.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.91.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.91.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.91.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.92.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.92.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.92.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.92.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.92.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.92.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.93.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.93.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.93.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.93.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.93.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.93.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.94.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.94.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.94.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.94.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.94.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.94.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.95.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.95.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.95.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.95.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.95.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.95.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.96.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.96.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.96.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.96.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.96.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.96.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.97.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.97.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.97.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.97.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.97.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.97.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.98.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.98.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.98.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.98.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.98.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.98.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.99.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.99.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.99.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.99.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.99.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.experts.99.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.gate.e_score_correction_bias": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.gate.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.shared_experts.down_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.shared_experts.down_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.shared_experts.gate_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.shared_experts.gate_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.shared_experts.up_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.mlp.shared_experts.up_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.post_attention_layernorm.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.self_attn.k_norm.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.self_attn.k_proj.bias": "model-00046-of-00092.safetensors",
+ "model.layers.45.self_attn.k_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.self_attn.k_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.self_attn.o_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.self_attn.o_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.self_attn.q_norm.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.self_attn.q_proj.bias": "model-00046-of-00092.safetensors",
+ "model.layers.45.self_attn.q_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.self_attn.q_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.45.self_attn.v_proj.bias": "model-00046-of-00092.safetensors",
+ "model.layers.45.self_attn.v_proj.weight": "model-00046-of-00092.safetensors",
+ "model.layers.45.self_attn.v_proj.weight_scale": "model-00046-of-00092.safetensors",
+ "model.layers.46.input_layernorm.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.0.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.0.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.0.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.0.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.0.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.0.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.1.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.1.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.1.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.1.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.1.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.1.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.10.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.10.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.10.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.10.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.10.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.10.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.100.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.100.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.100.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.100.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.100.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.100.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.101.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.101.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.101.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.101.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.101.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.101.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.102.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.102.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.102.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.102.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.102.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.102.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.103.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.103.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.103.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.103.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.103.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.103.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.104.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.104.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.104.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.104.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.104.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.104.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.105.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.105.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.105.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.105.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.105.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.105.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.106.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.106.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.106.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.106.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.106.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.106.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.107.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.107.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.107.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.107.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.107.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.107.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.108.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.108.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.108.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.108.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.108.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.108.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.109.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.109.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.109.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.109.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.109.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.109.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.11.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.11.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.11.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.11.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.11.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.11.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.110.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.110.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.110.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.110.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.110.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.110.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.111.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.111.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.111.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.111.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.111.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.111.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.112.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.112.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.112.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.112.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.112.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.112.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.113.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.113.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.113.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.113.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.113.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.113.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.114.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.114.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.114.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.114.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.114.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.114.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.115.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.115.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.115.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.115.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.115.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.115.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.116.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.116.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.116.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.116.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.116.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.116.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.117.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.117.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.117.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.117.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.117.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.117.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.118.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.118.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.118.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.118.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.118.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.118.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.119.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.119.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.119.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.119.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.119.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.119.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.12.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.12.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.12.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.12.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.12.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.12.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.120.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.120.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.120.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.120.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.120.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.120.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.121.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.121.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.121.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.121.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.121.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.121.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.122.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.122.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.122.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.122.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.122.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.122.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.123.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.123.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.123.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.123.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.123.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.123.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.124.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.124.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.124.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.124.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.124.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.124.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.125.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.125.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.125.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.125.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.125.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.125.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.126.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.126.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.126.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.126.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.126.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.126.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.127.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.127.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.127.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.127.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.127.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.127.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.128.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.128.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.128.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.128.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.128.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.128.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.129.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.129.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.129.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.129.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.129.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.129.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.13.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.13.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.13.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.13.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.13.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.13.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.130.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.130.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.130.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.130.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.130.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.130.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.131.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.131.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.131.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.131.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.131.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.131.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.132.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.132.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.132.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.132.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.132.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.132.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.133.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.133.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.133.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.133.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.133.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.133.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.134.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.134.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.134.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.134.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.134.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.134.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.135.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.135.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.135.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.135.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.135.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.135.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.136.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.136.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.136.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.136.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.136.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.136.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.137.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.137.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.137.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.137.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.137.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.137.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.138.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.138.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.138.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.138.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.138.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.138.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.139.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.139.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.139.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.139.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.139.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.139.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.14.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.14.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.14.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.14.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.14.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.14.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.140.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.140.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.140.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.140.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.140.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.140.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.141.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.141.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.141.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.141.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.141.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.141.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.142.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.142.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.142.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.142.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.142.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.142.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.143.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.143.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.143.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.143.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.143.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.143.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.144.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.144.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.144.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.144.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.144.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.144.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.145.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.145.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.145.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.145.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.145.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.145.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.146.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.146.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.146.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.146.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.146.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.146.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.147.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.147.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.147.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.147.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.147.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.147.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.148.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.148.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.148.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.148.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.148.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.148.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.149.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.149.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.149.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.149.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.149.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.149.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.15.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.15.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.15.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.15.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.15.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.15.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.150.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.150.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.150.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.150.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.150.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.150.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.151.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.151.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.151.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.151.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.151.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.151.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.152.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.152.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.152.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.152.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.152.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.152.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.153.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.153.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.153.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.153.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.153.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.153.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.154.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.154.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.154.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.154.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.154.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.154.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.155.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.155.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.155.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.155.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.155.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.155.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.156.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.156.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.156.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.156.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.156.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.156.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.157.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.157.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.157.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.157.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.157.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.157.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.158.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.158.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.158.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.158.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.158.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.158.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.159.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.159.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.159.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.159.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.159.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.159.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.16.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.16.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.16.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.16.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.16.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.16.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.17.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.17.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.17.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.17.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.17.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.17.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.18.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.18.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.18.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.18.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.18.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.18.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.19.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.19.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.19.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.19.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.19.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.19.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.2.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.2.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.2.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.2.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.2.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.2.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.20.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.20.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.20.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.20.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.20.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.20.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.21.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.21.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.21.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.21.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.21.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.21.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.22.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.22.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.22.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.22.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.22.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.22.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.23.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.23.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.23.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.23.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.23.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.23.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.24.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.24.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.24.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.24.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.24.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.24.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.25.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.25.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.25.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.25.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.25.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.25.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.26.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.26.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.26.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.26.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.26.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.26.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.27.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.27.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.27.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.27.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.27.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.27.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.28.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.28.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.28.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.28.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.28.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.28.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.29.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.29.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.29.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.29.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.29.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.29.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.3.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.3.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.3.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.3.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.3.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.3.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.30.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.30.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.30.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.30.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.30.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.30.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.31.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.31.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.31.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.31.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.31.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.31.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.32.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.32.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.32.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.32.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.32.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.32.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.33.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.33.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.33.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.33.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.33.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.33.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.34.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.34.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.34.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.34.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.34.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.34.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.35.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.35.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.35.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.35.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.35.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.35.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.36.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.36.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.36.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.36.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.36.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.36.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.37.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.37.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.37.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.37.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.37.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.37.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.38.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.38.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.38.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.38.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.38.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.38.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.39.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.39.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.39.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.39.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.39.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.39.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.4.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.4.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.4.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.4.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.4.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.4.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.40.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.40.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.40.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.40.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.40.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.40.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.41.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.41.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.41.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.41.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.41.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.41.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.42.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.42.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.42.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.42.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.42.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.42.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.43.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.43.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.43.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.43.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.43.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.43.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.44.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.44.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.44.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.44.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.44.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.44.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.45.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.45.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.45.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.45.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.45.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.45.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.46.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.46.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.46.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.46.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.46.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.46.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.47.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.47.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.47.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.47.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.47.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.47.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.48.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.48.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.48.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.48.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.48.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.48.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.49.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.49.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.49.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.49.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.49.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.49.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.5.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.5.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.5.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.5.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.5.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.5.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.50.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.50.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.50.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.50.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.50.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.50.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.51.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.51.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.51.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.51.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.51.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.51.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.52.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.52.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.52.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.52.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.52.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.52.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.53.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.53.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.53.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.53.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.53.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.53.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.54.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.54.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.54.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.54.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.54.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.54.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.55.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.55.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.55.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.55.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.55.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.55.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.56.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.56.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.56.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.56.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.56.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.56.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.57.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.57.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.57.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.57.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.57.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.57.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.58.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.58.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.58.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.58.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.58.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.58.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.59.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.59.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.59.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.59.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.59.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.59.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.6.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.6.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.6.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.6.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.6.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.6.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.60.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.60.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.60.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.60.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.60.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.60.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.61.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.61.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.61.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.61.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.61.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.61.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.62.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.62.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.62.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.62.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.62.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.62.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.63.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.63.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.63.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.63.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.63.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.63.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.64.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.64.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.64.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.64.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.64.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.64.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.65.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.65.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.65.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.65.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.65.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.65.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.66.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.66.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.66.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.66.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.66.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.66.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.67.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.67.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.67.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.67.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.67.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.67.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.68.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.68.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.68.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.68.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.68.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.68.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.69.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.69.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.69.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.69.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.69.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.69.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.7.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.7.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.7.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.7.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.7.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.7.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.70.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.70.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.70.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.70.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.70.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.70.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.71.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.71.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.71.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.71.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.71.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.71.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.72.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.72.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.72.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.72.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.72.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.72.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.73.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.73.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.73.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.73.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.73.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.73.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.74.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.74.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.74.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.74.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.74.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.74.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.75.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.75.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.75.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.75.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.75.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.75.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.76.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.76.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.76.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.76.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.76.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.76.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.77.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.77.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.77.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.77.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.77.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.77.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.78.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.78.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.78.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.78.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.78.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.78.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.79.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.79.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.79.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.79.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.79.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.79.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.8.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.8.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.8.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.8.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.8.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.8.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.80.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.80.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.80.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.80.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.80.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.80.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.81.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.81.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.81.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.81.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.81.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.81.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.82.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.82.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.82.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.82.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.82.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.82.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.83.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.83.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.83.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.83.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.83.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.83.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.84.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.84.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.84.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.84.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.84.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.84.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.85.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.85.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.85.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.85.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.85.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.85.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.86.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.86.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.86.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.86.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.86.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.86.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.87.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.87.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.87.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.87.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.87.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.87.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.88.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.88.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.88.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.88.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.88.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.88.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.89.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.89.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.89.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.89.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.89.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.89.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.9.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.9.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.9.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.9.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.9.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.9.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.90.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.90.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.90.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.90.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.90.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.90.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.91.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.91.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.91.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.91.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.91.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.91.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.92.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.92.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.92.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.92.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.92.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.92.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.93.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.93.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.93.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.93.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.93.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.93.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.94.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.94.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.94.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.94.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.94.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.94.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.95.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.95.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.95.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.95.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.95.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.95.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.96.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.96.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.96.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.96.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.96.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.96.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.97.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.97.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.97.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.97.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.97.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.97.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.98.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.98.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.98.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.98.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.98.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.98.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.99.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.99.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.99.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.99.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.99.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.experts.99.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.gate.e_score_correction_bias": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.gate.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.shared_experts.down_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.shared_experts.down_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.shared_experts.gate_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.shared_experts.gate_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.shared_experts.up_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.mlp.shared_experts.up_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.post_attention_layernorm.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.self_attn.k_norm.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.self_attn.k_proj.bias": "model-00047-of-00092.safetensors",
+ "model.layers.46.self_attn.k_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.self_attn.k_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.self_attn.o_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.self_attn.o_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.self_attn.q_norm.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.self_attn.q_proj.bias": "model-00047-of-00092.safetensors",
+ "model.layers.46.self_attn.q_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.self_attn.q_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.46.self_attn.v_proj.bias": "model-00047-of-00092.safetensors",
+ "model.layers.46.self_attn.v_proj.weight": "model-00047-of-00092.safetensors",
+ "model.layers.46.self_attn.v_proj.weight_scale": "model-00047-of-00092.safetensors",
+ "model.layers.47.input_layernorm.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.0.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.0.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.0.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.0.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.0.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.0.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.1.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.1.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.1.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.1.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.1.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.1.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.10.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.10.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.10.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.10.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.10.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.10.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.100.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.100.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.100.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.100.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.100.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.100.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.101.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.101.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.101.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.101.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.101.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.101.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.102.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.102.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.102.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.102.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.102.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.102.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.103.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.103.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.103.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.103.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.103.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.103.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.104.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.104.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.104.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.104.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.104.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.104.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.105.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.105.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.105.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.105.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.105.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.105.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.106.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.106.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.106.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.106.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.106.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.106.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.107.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.107.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.107.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.107.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.107.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.107.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.108.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.108.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.108.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.108.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.108.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.108.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.109.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.109.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.109.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.109.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.109.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.109.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.11.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.11.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.11.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.11.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.11.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.11.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.110.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.110.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.110.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.110.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.110.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.110.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.111.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.111.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.111.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.111.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.111.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.111.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.112.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.112.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.112.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.112.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.112.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.112.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.113.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.113.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.113.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.113.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.113.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.113.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.114.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.114.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.114.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.114.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.114.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.114.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.115.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.115.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.115.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.115.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.115.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.115.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.116.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.116.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.116.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.116.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.116.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.116.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.117.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.117.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.117.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.117.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.117.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.117.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.118.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.118.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.118.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.118.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.118.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.118.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.119.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.119.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.119.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.119.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.119.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.119.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.12.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.12.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.12.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.12.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.12.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.12.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.120.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.120.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.120.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.120.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.120.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.120.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.121.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.121.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.121.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.121.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.121.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.121.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.122.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.122.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.122.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.122.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.122.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.122.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.123.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.123.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.123.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.123.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.123.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.123.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.124.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.124.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.124.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.124.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.124.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.124.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.125.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.125.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.125.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.125.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.125.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.125.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.126.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.126.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.126.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.126.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.126.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.126.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.127.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.127.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.127.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.127.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.127.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.127.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.128.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.128.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.128.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.128.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.128.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.128.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.129.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.129.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.129.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.129.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.129.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.129.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.13.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.13.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.13.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.13.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.13.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.13.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.130.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.130.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.130.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.130.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.130.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.130.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.131.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.131.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.131.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.131.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.131.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.131.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.132.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.132.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.132.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.132.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.132.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.132.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.133.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.133.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.133.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.133.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.133.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.133.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.134.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.134.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.134.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.134.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.134.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.134.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.135.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.135.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.135.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.135.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.135.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.135.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.136.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.136.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.136.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.136.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.136.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.136.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.137.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.137.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.137.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.137.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.137.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.137.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.138.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.138.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.138.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.138.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.138.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.138.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.139.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.139.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.139.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.139.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.139.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.139.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.14.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.14.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.14.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.14.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.14.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.14.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.140.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.140.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.140.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.140.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.140.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.140.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.141.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.141.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.141.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.141.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.141.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.141.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.142.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.142.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.142.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.142.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.142.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.142.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.143.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.143.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.143.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.143.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.143.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.143.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.144.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.144.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.144.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.144.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.144.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.144.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.145.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.145.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.145.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.145.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.145.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.145.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.146.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.146.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.146.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.146.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.146.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.146.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.147.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.147.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.147.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.147.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.147.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.147.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.148.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.148.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.148.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.148.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.148.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.148.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.149.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.149.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.149.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.149.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.149.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.149.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.15.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.15.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.15.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.15.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.15.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.15.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.150.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.150.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.150.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.150.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.150.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.150.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.151.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.151.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.151.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.151.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.151.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.151.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.152.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.152.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.152.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.152.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.152.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.152.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.153.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.153.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.153.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.153.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.153.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.153.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.154.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.154.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.154.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.154.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.154.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.154.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.155.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.155.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.155.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.155.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.155.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.155.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.156.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.156.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.156.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.156.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.156.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.156.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.157.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.157.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.157.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.157.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.157.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.157.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.158.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.158.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.158.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.158.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.158.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.158.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.159.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.159.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.159.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.159.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.159.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.159.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.16.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.16.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.16.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.16.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.16.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.16.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.17.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.17.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.17.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.17.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.17.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.17.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.18.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.18.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.18.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.18.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.18.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.18.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.19.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.19.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.19.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.19.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.19.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.19.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.2.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.2.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.2.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.2.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.2.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.2.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.20.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.20.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.20.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.20.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.20.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.20.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.21.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.21.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.21.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.21.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.21.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.21.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.22.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.22.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.22.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.22.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.22.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.22.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.23.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.23.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.23.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.23.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.23.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.23.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.24.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.24.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.24.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.24.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.24.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.24.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.25.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.25.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.25.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.25.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.25.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.25.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.26.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.26.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.26.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.26.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.26.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.26.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.27.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.27.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.27.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.27.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.27.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.27.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.28.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.28.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.28.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.28.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.28.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.28.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.29.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.29.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.29.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.29.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.29.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.29.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.3.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.3.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.3.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.3.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.3.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.3.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.30.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.30.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.30.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.30.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.30.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.30.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.31.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.31.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.31.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.31.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.31.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.31.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.32.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.32.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.32.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.32.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.32.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.32.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.33.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.33.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.33.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.33.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.33.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.33.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.34.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.34.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.34.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.34.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.34.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.34.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.35.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.35.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.35.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.35.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.35.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.35.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.36.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.36.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.36.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.36.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.36.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.36.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.37.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.37.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.37.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.37.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.37.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.37.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.38.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.38.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.38.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.38.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.38.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.38.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.39.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.39.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.39.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.39.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.39.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.39.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.4.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.4.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.4.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.4.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.4.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.4.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.40.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.40.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.40.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.40.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.40.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.40.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.41.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.41.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.41.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.41.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.41.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.41.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.42.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.42.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.42.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.42.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.42.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.42.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.43.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.43.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.43.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.43.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.43.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.43.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.44.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.44.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.44.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.44.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.44.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.44.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.45.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.45.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.45.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.45.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.45.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.45.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.46.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.46.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.46.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.46.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.46.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.46.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.47.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.47.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.47.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.47.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.47.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.47.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.48.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.48.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.48.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.48.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.48.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.48.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.49.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.49.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.49.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.49.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.49.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.49.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.5.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.5.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.5.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.5.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.5.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.5.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.50.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.50.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.50.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.50.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.50.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.50.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.51.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.51.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.51.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.51.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.51.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.51.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.52.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.52.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.52.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.52.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.52.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.52.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.53.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.53.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.53.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.53.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.53.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.53.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.54.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.54.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.54.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.54.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.54.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.54.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.55.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.55.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.55.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.55.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.55.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.55.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.56.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.56.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.56.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.56.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.56.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.56.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.57.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.57.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.57.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.57.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.57.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.57.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.58.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.58.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.58.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.58.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.58.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.58.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.59.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.59.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.59.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.59.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.59.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.59.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.6.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.6.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.6.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.6.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.6.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.6.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.60.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.60.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.60.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.60.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.60.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.60.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.61.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.61.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.61.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.61.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.61.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.61.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.62.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.62.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.62.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.62.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.62.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.62.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.63.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.63.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.63.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.63.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.63.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.63.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.64.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.64.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.64.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.64.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.64.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.64.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.65.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.65.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.65.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.65.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.65.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.65.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.66.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.66.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.66.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.66.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.66.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.66.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.67.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.67.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.67.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.67.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.67.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.67.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.68.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.68.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.68.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.68.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.68.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.68.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.69.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.69.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.69.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.69.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.69.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.69.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.7.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.7.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.7.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.7.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.7.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.7.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.70.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.70.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.70.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.70.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.70.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.70.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.71.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.71.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.71.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.71.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.71.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.71.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.72.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.72.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.72.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.72.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.72.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.72.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.73.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.73.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.73.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.73.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.73.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.73.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.74.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.74.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.74.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.74.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.74.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.74.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.75.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.75.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.75.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.75.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.75.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.75.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.76.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.76.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.76.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.76.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.76.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.76.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.77.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.77.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.77.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.77.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.77.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.77.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.78.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.78.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.78.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.78.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.78.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.78.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.79.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.79.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.79.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.79.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.79.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.79.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.8.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.8.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.8.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.8.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.8.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.8.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.80.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.80.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.80.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.80.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.80.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.80.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.81.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.81.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.81.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.81.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.81.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.81.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.82.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.82.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.82.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.82.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.82.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.82.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.83.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.83.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.83.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.83.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.83.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.83.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.84.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.84.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.84.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.84.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.84.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.84.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.85.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.85.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.85.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.85.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.85.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.85.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.86.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.86.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.86.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.86.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.86.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.86.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.87.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.87.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.87.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.87.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.87.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.87.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.88.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.88.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.88.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.88.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.88.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.88.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.89.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.89.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.89.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.89.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.89.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.89.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.9.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.9.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.9.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.9.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.9.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.9.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.90.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.90.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.90.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.90.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.90.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.90.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.91.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.91.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.91.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.91.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.91.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.91.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.92.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.92.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.92.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.92.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.92.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.92.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.93.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.93.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.93.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.93.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.93.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.93.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.94.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.94.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.94.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.94.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.94.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.94.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.95.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.95.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.95.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.95.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.95.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.95.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.96.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.96.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.96.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.96.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.96.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.96.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.97.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.97.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.97.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.97.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.97.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.97.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.98.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.98.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.98.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.98.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.98.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.98.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.99.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.99.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.99.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.99.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.99.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.experts.99.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.gate.e_score_correction_bias": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.gate.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.shared_experts.down_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.shared_experts.down_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.shared_experts.gate_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.shared_experts.gate_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.shared_experts.up_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.mlp.shared_experts.up_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.post_attention_layernorm.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.self_attn.k_norm.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.self_attn.k_proj.bias": "model-00048-of-00092.safetensors",
+ "model.layers.47.self_attn.k_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.self_attn.k_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.self_attn.o_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.self_attn.o_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.self_attn.q_norm.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.self_attn.q_proj.bias": "model-00048-of-00092.safetensors",
+ "model.layers.47.self_attn.q_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.self_attn.q_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.47.self_attn.v_proj.bias": "model-00048-of-00092.safetensors",
+ "model.layers.47.self_attn.v_proj.weight": "model-00048-of-00092.safetensors",
+ "model.layers.47.self_attn.v_proj.weight_scale": "model-00048-of-00092.safetensors",
+ "model.layers.48.input_layernorm.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.0.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.0.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.0.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.0.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.0.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.0.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.1.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.1.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.1.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.1.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.1.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.1.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.10.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.10.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.10.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.10.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.10.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.10.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.100.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.100.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.100.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.100.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.100.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.100.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.101.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.101.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.101.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.101.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.101.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.101.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.102.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.102.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.102.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.102.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.102.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.102.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.103.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.103.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.103.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.103.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.103.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.103.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.104.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.104.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.104.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.104.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.104.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.104.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.105.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.105.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.105.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.105.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.105.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.105.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.106.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.106.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.106.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.106.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.106.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.106.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.107.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.107.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.107.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.107.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.107.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.107.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.108.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.108.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.108.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.108.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.108.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.108.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.109.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.109.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.109.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.109.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.109.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.109.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.11.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.11.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.11.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.11.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.11.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.11.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.110.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.110.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.110.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.110.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.110.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.110.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.111.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.111.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.111.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.111.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.111.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.111.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.112.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.112.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.112.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.112.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.112.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.112.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.113.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.113.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.113.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.113.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.113.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.113.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.114.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.114.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.114.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.114.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.114.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.114.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.115.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.115.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.115.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.115.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.115.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.115.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.116.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.116.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.116.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.116.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.116.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.116.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.117.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.117.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.117.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.117.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.117.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.117.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.118.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.118.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.118.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.118.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.118.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.118.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.119.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.119.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.119.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.119.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.119.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.119.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.12.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.12.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.12.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.12.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.12.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.12.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.120.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.120.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.120.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.120.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.120.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.120.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.121.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.121.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.121.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.121.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.121.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.121.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.122.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.122.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.122.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.122.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.122.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.122.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.123.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.123.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.123.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.123.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.123.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.123.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.124.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.124.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.124.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.124.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.124.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.124.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.125.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.125.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.125.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.125.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.125.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.125.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.126.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.126.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.126.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.126.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.126.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.126.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.127.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.127.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.127.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.127.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.127.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.127.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.128.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.128.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.128.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.128.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.128.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.128.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.129.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.129.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.129.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.129.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.129.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.129.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.13.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.13.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.13.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.13.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.13.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.13.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.130.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.130.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.130.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.130.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.130.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.130.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.131.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.131.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.131.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.131.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.131.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.131.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.132.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.132.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.132.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.132.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.132.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.132.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.133.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.133.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.133.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.133.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.133.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.133.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.134.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.134.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.134.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.134.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.134.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.134.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.135.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.135.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.135.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.135.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.135.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.135.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.136.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.136.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.136.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.136.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.136.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.136.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.137.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.137.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.137.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.137.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.137.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.137.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.138.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.138.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.138.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.138.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.138.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.138.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.139.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.139.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.139.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.139.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.139.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.139.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.14.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.14.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.14.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.14.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.14.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.14.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.140.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.140.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.140.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.140.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.140.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.140.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.141.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.141.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.141.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.141.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.141.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.141.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.142.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.142.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.142.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.142.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.142.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.142.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.143.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.143.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.143.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.143.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.143.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.143.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.144.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.144.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.144.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.144.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.144.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.144.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.145.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.145.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.145.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.145.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.145.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.145.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.146.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.146.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.146.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.146.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.146.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.146.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.147.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.147.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.147.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.147.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.147.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.147.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.148.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.148.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.148.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.148.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.148.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.148.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.149.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.149.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.149.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.149.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.149.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.149.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.15.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.15.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.15.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.15.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.15.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.15.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.150.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.150.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.150.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.150.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.150.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.150.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.151.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.151.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.151.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.151.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.151.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.151.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.152.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.152.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.152.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.152.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.152.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.152.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.153.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.153.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.153.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.153.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.153.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.153.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.154.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.154.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.154.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.154.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.154.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.154.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.155.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.155.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.155.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.155.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.155.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.155.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.156.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.156.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.156.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.156.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.156.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.156.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.157.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.157.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.157.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.157.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.157.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.157.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.158.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.158.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.158.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.158.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.158.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.158.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.159.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.159.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.159.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.159.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.159.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.159.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.16.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.16.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.16.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.16.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.16.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.16.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.17.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.17.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.17.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.17.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.17.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.17.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.18.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.18.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.18.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.18.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.18.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.18.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.19.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.19.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.19.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.19.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.19.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.19.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.2.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.2.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.2.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.2.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.2.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.2.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.20.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.20.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.20.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.20.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.20.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.20.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.21.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.21.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.21.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.21.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.21.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.21.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.22.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.22.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.22.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.22.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.22.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.22.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.23.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.23.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.23.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.23.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.23.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.23.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.24.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.24.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.24.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.24.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.24.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.24.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.25.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.25.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.25.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.25.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.25.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.25.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.26.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.26.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.26.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.26.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.26.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.26.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.27.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.27.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.27.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.27.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.27.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.27.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.28.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.28.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.28.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.28.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.28.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.28.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.29.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.29.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.29.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.29.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.29.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.29.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.3.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.3.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.3.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.3.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.3.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.3.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.30.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.30.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.30.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.30.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.30.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.30.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.31.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.31.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.31.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.31.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.31.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.31.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.32.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.32.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.32.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.32.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.32.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.32.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.33.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.33.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.33.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.33.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.33.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.33.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.34.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.34.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.34.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.34.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.34.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.34.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.35.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.35.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.35.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.35.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.35.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.35.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.36.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.36.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.36.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.36.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.36.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.36.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.37.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.37.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.37.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.37.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.37.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.37.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.38.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.38.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.38.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.38.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.38.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.38.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.39.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.39.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.39.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.39.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.39.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.39.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.4.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.4.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.4.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.4.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.4.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.4.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.40.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.40.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.40.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.40.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.40.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.40.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.41.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.41.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.41.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.41.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.41.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.41.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.42.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.42.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.42.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.42.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.42.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.42.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.43.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.43.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.43.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.43.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.43.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.43.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.44.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.44.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.44.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.44.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.44.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.44.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.45.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.45.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.45.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.45.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.45.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.45.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.46.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.46.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.46.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.46.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.46.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.46.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.47.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.47.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.47.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.47.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.47.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.47.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.48.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.48.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.48.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.48.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.48.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.48.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.49.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.49.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.49.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.49.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.49.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.49.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.5.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.5.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.5.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.5.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.5.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.5.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.50.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.50.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.50.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.50.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.50.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.50.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.51.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.51.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.51.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.51.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.51.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.51.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.52.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.52.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.52.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.52.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.52.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.52.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.53.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.53.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.53.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.53.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.53.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.53.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.54.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.54.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.54.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.54.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.54.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.54.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.55.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.55.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.55.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.55.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.55.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.55.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.56.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.56.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.56.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.56.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.56.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.56.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.57.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.57.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.57.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.57.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.57.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.57.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.58.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.58.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.58.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.58.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.58.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.58.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.59.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.59.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.59.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.59.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.59.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.59.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.6.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.6.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.6.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.6.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.6.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.6.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.60.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.60.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.60.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.60.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.60.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.60.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.61.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.61.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.61.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.61.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.61.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.61.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.62.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.62.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.62.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.62.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.62.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.62.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.63.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.63.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.63.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.63.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.63.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.63.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.64.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.64.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.64.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.64.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.64.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.64.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.65.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.65.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.65.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.65.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.65.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.65.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.66.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.66.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.66.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.66.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.66.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.66.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.67.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.67.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.67.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.67.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.67.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.67.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.68.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.68.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.68.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.68.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.68.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.68.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.69.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.69.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.69.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.69.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.69.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.69.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.7.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.7.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.7.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.7.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.7.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.7.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.70.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.70.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.70.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.70.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.70.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.70.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.71.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.71.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.71.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.71.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.71.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.71.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.72.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.72.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.72.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.72.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.72.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.72.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.73.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.73.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.73.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.73.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.73.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.73.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.74.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.74.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.74.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.74.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.74.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.74.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.75.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.75.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.75.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.75.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.75.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.75.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.76.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.76.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.76.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.76.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.76.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.76.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.77.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.77.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.77.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.77.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.77.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.77.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.78.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.78.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.78.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.78.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.78.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.78.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.79.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.79.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.79.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.79.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.79.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.79.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.8.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.8.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.8.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.8.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.8.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.8.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.80.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.80.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.80.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.80.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.80.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.80.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.81.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.81.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.81.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.81.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.81.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.81.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.82.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.82.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.82.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.82.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.82.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.82.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.83.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.83.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.83.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.83.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.83.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.83.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.84.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.84.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.84.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.84.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.84.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.84.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.85.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.85.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.85.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.85.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.85.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.85.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.86.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.86.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.86.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.86.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.86.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.86.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.87.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.87.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.87.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.87.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.87.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.87.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.88.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.88.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.88.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.88.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.88.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.88.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.89.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.89.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.89.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.89.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.89.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.89.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.9.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.9.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.9.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.9.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.9.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.9.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.90.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.90.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.90.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.90.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.90.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.90.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.91.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.91.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.91.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.91.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.91.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.91.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.92.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.92.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.92.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.92.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.92.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.92.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.93.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.93.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.93.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.93.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.93.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.93.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.94.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.94.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.94.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.94.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.94.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.94.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.95.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.95.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.95.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.95.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.95.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.95.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.96.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.96.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.96.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.96.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.96.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.96.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.97.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.97.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.97.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.97.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.97.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.97.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.98.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.98.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.98.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.98.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.98.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.98.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.99.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.99.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.99.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.99.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.99.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.experts.99.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.gate.e_score_correction_bias": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.gate.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.shared_experts.down_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.shared_experts.down_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.shared_experts.gate_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.shared_experts.gate_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.shared_experts.up_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.mlp.shared_experts.up_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.post_attention_layernorm.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.self_attn.k_norm.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.self_attn.k_proj.bias": "model-00049-of-00092.safetensors",
+ "model.layers.48.self_attn.k_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.self_attn.k_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.self_attn.o_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.self_attn.o_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.self_attn.q_norm.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.self_attn.q_proj.bias": "model-00049-of-00092.safetensors",
+ "model.layers.48.self_attn.q_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.self_attn.q_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.48.self_attn.v_proj.bias": "model-00049-of-00092.safetensors",
+ "model.layers.48.self_attn.v_proj.weight": "model-00049-of-00092.safetensors",
+ "model.layers.48.self_attn.v_proj.weight_scale": "model-00049-of-00092.safetensors",
+ "model.layers.49.input_layernorm.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.0.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.0.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.0.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.0.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.0.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.0.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.1.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.1.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.1.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.1.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.1.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.1.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.10.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.10.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.10.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.10.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.10.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.10.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.100.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.100.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.100.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.100.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.100.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.100.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.101.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.101.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.101.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.101.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.101.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.101.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.102.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.102.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.102.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.102.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.102.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.102.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.103.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.103.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.103.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.103.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.103.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.103.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.104.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.104.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.104.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.104.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.104.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.104.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.105.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.105.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.105.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.105.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.105.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.105.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.106.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.106.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.106.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.106.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.106.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.106.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.107.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.107.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.107.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.107.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.107.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.107.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.108.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.108.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.108.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.108.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.108.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.108.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.109.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.109.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.109.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.109.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.109.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.109.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.11.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.11.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.11.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.11.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.11.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.11.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.110.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.110.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.110.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.110.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.110.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.110.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.111.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.111.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.111.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.111.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.111.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.111.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.112.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.112.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.112.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.112.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.112.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.112.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.113.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.113.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.113.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.113.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.113.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.113.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.114.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.114.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.114.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.114.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.114.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.114.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.115.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.115.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.115.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.115.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.115.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.115.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.116.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.116.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.116.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.116.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.116.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.116.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.117.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.117.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.117.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.117.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.117.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.117.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.118.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.118.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.118.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.118.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.118.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.118.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.119.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.119.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.119.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.119.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.119.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.119.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.12.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.12.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.12.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.12.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.12.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.12.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.120.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.120.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.120.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.120.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.120.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.120.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.121.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.121.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.121.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.121.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.121.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.121.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.122.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.122.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.122.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.122.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.122.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.122.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.123.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.123.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.123.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.123.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.123.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.123.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.124.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.124.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.124.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.124.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.124.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.124.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.125.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.125.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.125.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.125.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.125.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.125.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.126.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.126.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.126.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.126.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.126.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.126.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.127.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.127.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.127.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.127.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.127.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.127.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.128.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.128.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.128.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.128.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.128.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.128.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.129.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.129.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.129.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.129.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.129.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.129.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.13.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.13.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.13.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.13.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.13.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.13.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.130.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.130.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.130.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.130.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.130.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.130.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.131.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.131.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.131.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.131.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.131.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.131.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.132.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.132.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.132.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.132.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.132.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.132.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.133.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.133.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.133.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.133.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.133.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.133.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.134.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.134.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.134.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.134.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.134.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.134.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.135.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.135.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.135.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.135.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.135.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.135.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.136.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.136.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.136.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.136.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.136.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.136.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.137.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.137.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.137.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.137.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.137.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.137.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.138.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.138.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.138.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.138.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.138.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.138.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.139.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.139.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.139.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.139.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.139.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.139.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.14.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.14.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.14.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.14.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.14.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.14.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.140.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.140.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.140.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.140.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.140.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.140.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.141.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.141.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.141.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.141.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.141.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.141.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.142.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.142.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.142.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.142.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.142.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.142.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.143.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.143.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.143.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.143.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.143.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.143.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.144.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.144.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.144.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.144.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.144.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.144.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.145.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.145.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.145.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.145.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.145.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.145.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.146.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.146.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.146.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.146.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.146.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.146.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.147.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.147.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.147.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.147.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.147.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.147.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.148.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.148.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.148.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.148.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.148.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.148.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.149.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.149.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.149.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.149.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.149.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.149.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.15.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.15.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.15.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.15.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.15.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.15.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.150.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.150.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.150.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.150.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.150.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.150.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.151.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.151.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.151.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.151.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.151.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.151.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.152.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.152.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.152.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.152.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.152.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.152.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.153.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.153.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.153.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.153.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.153.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.153.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.154.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.154.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.154.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.154.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.154.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.154.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.155.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.155.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.155.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.155.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.155.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.155.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.156.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.156.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.156.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.156.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.156.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.156.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.157.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.157.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.157.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.157.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.157.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.157.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.158.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.158.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.158.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.158.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.158.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.158.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.159.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.159.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.159.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.159.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.159.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.159.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.16.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.16.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.16.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.16.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.16.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.16.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.17.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.17.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.17.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.17.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.17.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.17.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.18.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.18.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.18.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.18.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.18.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.18.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.19.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.19.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.19.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.19.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.19.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.19.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.2.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.2.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.2.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.2.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.2.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.2.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.20.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.20.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.20.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.20.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.20.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.20.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.21.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.21.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.21.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.21.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.21.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.21.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.22.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.22.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.22.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.22.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.22.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.22.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.23.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.23.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.23.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.23.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.23.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.23.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.24.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.24.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.24.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.24.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.24.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.24.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.25.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.25.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.25.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.25.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.25.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.25.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.26.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.26.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.26.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.26.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.26.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.26.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.27.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.27.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.27.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.27.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.27.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.27.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.28.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.28.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.28.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.28.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.28.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.28.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.29.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.29.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.29.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.29.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.29.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.29.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.3.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.3.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.3.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.3.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.3.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.3.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.30.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.30.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.30.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.30.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.30.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.30.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.31.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.31.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.31.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.31.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.31.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.31.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.32.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.32.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.32.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.32.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.32.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.32.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.33.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.33.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.33.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.33.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.33.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.33.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.34.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.34.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.34.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.34.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.34.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.34.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.35.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.35.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.35.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.35.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.35.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.35.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.36.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.36.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.36.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.36.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.36.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.36.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.37.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.37.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.37.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.37.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.37.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.37.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.38.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.38.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.38.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.38.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.38.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.38.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.39.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.39.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.39.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.39.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.39.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.39.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.4.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.4.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.4.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.4.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.4.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.4.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.40.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.40.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.40.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.40.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.40.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.40.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.41.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.41.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.41.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.41.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.41.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.41.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.42.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.42.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.42.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.42.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.42.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.42.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.43.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.43.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.43.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.43.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.43.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.43.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.44.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.44.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.44.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.44.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.44.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.44.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.45.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.45.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.45.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.45.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.45.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.45.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.46.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.46.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.46.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.46.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.46.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.46.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.47.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.47.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.47.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.47.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.47.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.47.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.48.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.48.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.48.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.48.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.48.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.48.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.49.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.49.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.49.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.49.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.49.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.49.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.5.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.5.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.5.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.5.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.5.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.5.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.50.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.50.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.50.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.50.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.50.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.50.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.51.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.51.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.51.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.51.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.51.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.51.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.52.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.52.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.52.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.52.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.52.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.52.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.53.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.53.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.53.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.53.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.53.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.53.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.54.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.54.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.54.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.54.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.54.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.54.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.55.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.55.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.55.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.55.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.55.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.55.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.56.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.56.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.56.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.56.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.56.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.56.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.57.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.57.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.57.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.57.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.57.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.57.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.58.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.58.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.58.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.58.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.58.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.58.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.59.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.59.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.59.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.59.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.59.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.59.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.6.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.6.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.6.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.6.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.6.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.6.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.60.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.60.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.60.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.60.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.60.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.60.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.61.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.61.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.61.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.61.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.61.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.61.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.62.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.62.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.62.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.62.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.62.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.62.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.63.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.63.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.63.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.63.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.63.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.63.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.64.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.64.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.64.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.64.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.64.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.64.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.65.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.65.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.65.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.65.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.65.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.65.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.66.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.66.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.66.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.66.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.66.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.66.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.67.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.67.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.67.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.67.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.67.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.67.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.68.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.68.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.68.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.68.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.68.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.68.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.69.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.69.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.69.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.69.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.69.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.69.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.7.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.7.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.7.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.7.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.7.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.7.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.70.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.70.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.70.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.70.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.70.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.70.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.71.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.71.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.71.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.71.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.71.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.71.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.72.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.72.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.72.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.72.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.72.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.72.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.73.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.73.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.73.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.73.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.73.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.73.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.74.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.74.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.74.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.74.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.74.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.74.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.75.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.75.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.75.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.75.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.75.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.75.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.76.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.76.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.76.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.76.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.76.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.76.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.77.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.77.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.77.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.77.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.77.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.77.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.78.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.78.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.78.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.78.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.78.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.78.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.79.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.79.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.79.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.79.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.79.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.79.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.8.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.8.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.8.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.8.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.8.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.8.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.80.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.80.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.80.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.80.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.80.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.80.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.81.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.81.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.81.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.81.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.81.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.81.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.82.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.82.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.82.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.82.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.82.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.82.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.83.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.83.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.83.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.83.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.83.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.83.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.84.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.84.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.84.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.84.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.84.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.84.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.85.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.85.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.85.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.85.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.85.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.85.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.86.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.86.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.86.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.86.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.86.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.86.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.87.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.87.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.87.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.87.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.87.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.87.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.88.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.88.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.88.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.88.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.88.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.88.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.89.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.89.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.89.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.89.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.89.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.89.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.9.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.9.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.9.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.9.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.9.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.9.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.90.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.90.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.90.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.90.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.90.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.90.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.91.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.91.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.91.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.91.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.91.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.91.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.92.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.92.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.92.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.92.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.92.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.92.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.93.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.93.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.93.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.93.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.93.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.93.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.94.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.94.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.94.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.94.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.94.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.94.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.95.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.95.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.95.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.95.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.95.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.95.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.96.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.96.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.96.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.96.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.96.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.96.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.97.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.97.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.97.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.97.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.97.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.97.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.98.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.98.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.98.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.98.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.98.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.98.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.99.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.99.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.99.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.99.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.99.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.experts.99.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.gate.e_score_correction_bias": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.gate.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.shared_experts.down_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.shared_experts.down_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.shared_experts.gate_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.shared_experts.gate_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.shared_experts.up_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.mlp.shared_experts.up_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.post_attention_layernorm.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.self_attn.k_norm.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.self_attn.k_proj.bias": "model-00050-of-00092.safetensors",
+ "model.layers.49.self_attn.k_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.self_attn.k_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.self_attn.o_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.self_attn.o_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.self_attn.q_norm.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.self_attn.q_proj.bias": "model-00050-of-00092.safetensors",
+ "model.layers.49.self_attn.q_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.self_attn.q_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.49.self_attn.v_proj.bias": "model-00050-of-00092.safetensors",
+ "model.layers.49.self_attn.v_proj.weight": "model-00050-of-00092.safetensors",
+ "model.layers.49.self_attn.v_proj.weight_scale": "model-00050-of-00092.safetensors",
+ "model.layers.5.input_layernorm.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.0.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.0.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.0.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.0.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.0.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.0.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.1.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.1.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.1.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.1.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.1.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.1.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.10.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.10.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.10.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.10.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.10.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.10.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.100.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.100.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.100.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.100.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.100.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.100.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.101.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.101.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.101.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.101.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.101.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.101.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.102.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.102.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.102.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.102.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.102.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.102.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.103.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.103.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.103.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.103.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.103.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.103.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.104.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.104.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.104.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.104.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.104.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.104.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.105.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.105.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.105.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.105.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.105.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.105.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.106.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.106.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.106.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.106.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.106.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.106.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.107.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.107.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.107.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.107.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.107.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.107.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.108.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.108.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.108.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.108.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.108.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.108.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.109.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.109.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.109.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.109.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.109.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.109.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.11.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.11.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.11.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.11.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.11.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.11.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.110.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.110.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.110.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.110.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.110.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.110.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.111.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.111.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.111.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.111.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.111.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.111.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.112.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.112.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.112.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.112.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.112.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.112.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.113.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.113.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.113.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.113.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.113.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.113.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.114.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.114.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.114.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.114.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.114.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.114.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.115.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.115.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.115.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.115.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.115.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.115.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.116.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.116.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.116.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.116.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.116.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.116.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.117.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.117.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.117.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.117.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.117.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.117.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.118.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.118.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.118.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.118.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.118.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.118.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.119.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.119.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.119.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.119.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.119.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.119.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.12.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.12.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.12.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.12.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.12.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.12.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.120.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.120.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.120.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.120.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.120.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.120.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.121.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.121.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.121.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.121.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.121.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.121.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.122.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.122.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.122.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.122.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.122.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.122.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.123.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.123.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.123.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.123.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.123.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.123.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.124.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.124.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.124.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.124.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.124.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.124.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.125.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.125.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.125.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.125.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.125.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.125.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.126.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.126.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.126.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.126.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.126.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.126.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.127.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.127.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.127.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.127.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.127.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.127.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.128.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.128.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.128.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.128.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.128.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.128.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.129.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.129.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.129.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.129.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.129.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.129.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.13.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.13.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.13.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.13.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.13.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.13.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.130.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.130.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.130.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.130.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.130.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.130.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.131.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.131.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.131.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.131.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.131.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.131.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.132.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.132.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.132.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.132.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.132.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.132.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.133.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.133.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.133.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.133.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.133.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.133.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.134.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.134.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.134.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.134.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.134.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.134.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.135.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.135.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.135.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.135.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.135.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.135.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.136.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.136.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.136.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.136.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.136.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.136.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.137.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.137.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.137.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.137.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.137.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.137.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.138.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.138.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.138.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.138.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.138.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.138.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.139.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.139.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.139.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.139.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.139.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.139.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.14.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.14.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.14.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.14.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.14.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.14.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.140.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.140.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.140.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.140.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.140.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.140.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.141.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.141.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.141.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.141.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.141.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.141.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.142.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.142.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.142.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.142.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.142.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.142.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.143.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.143.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.143.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.143.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.143.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.143.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.144.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.144.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.144.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.144.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.144.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.144.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.145.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.145.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.145.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.145.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.145.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.145.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.146.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.146.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.146.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.146.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.146.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.146.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.147.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.147.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.147.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.147.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.147.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.147.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.148.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.148.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.148.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.148.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.148.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.148.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.149.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.149.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.149.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.149.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.149.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.149.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.15.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.15.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.15.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.15.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.15.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.15.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.150.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.150.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.150.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.150.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.150.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.150.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.151.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.151.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.151.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.151.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.151.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.151.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.152.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.152.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.152.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.152.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.152.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.152.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.153.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.153.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.153.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.153.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.153.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.153.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.154.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.154.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.154.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.154.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.154.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.154.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.155.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.155.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.155.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.155.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.155.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.155.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.156.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.156.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.156.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.156.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.156.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.156.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.157.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.157.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.157.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.157.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.157.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.157.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.158.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.158.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.158.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.158.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.158.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.158.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.159.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.159.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.159.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.159.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.159.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.159.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.16.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.16.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.16.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.16.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.16.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.16.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.17.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.17.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.17.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.17.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.17.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.17.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.18.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.18.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.18.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.18.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.18.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.18.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.19.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.19.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.19.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.19.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.19.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.19.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.2.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.2.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.2.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.2.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.2.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.2.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.20.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.20.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.20.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.20.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.20.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.20.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.21.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.21.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.21.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.21.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.21.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.21.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.22.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.22.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.22.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.22.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.22.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.22.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.23.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.23.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.23.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.23.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.23.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.23.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.24.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.24.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.24.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.24.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.24.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.24.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.25.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.25.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.25.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.25.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.25.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.25.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.26.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.26.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.26.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.26.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.26.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.26.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.27.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.27.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.27.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.27.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.27.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.27.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.28.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.28.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.28.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.28.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.28.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.28.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.29.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.29.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.29.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.29.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.29.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.29.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.3.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.3.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.3.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.3.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.3.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.3.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.30.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.30.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.30.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.30.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.30.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.30.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.31.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.31.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.31.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.31.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.31.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.31.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.32.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.32.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.32.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.32.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.32.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.32.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.33.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.33.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.33.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.33.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.33.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.33.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.34.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.34.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.34.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.34.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.34.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.34.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.35.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.35.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.35.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.35.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.35.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.35.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.36.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.36.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.36.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.36.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.36.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.36.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.37.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.37.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.37.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.37.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.37.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.37.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.38.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.38.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.38.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.38.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.38.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.38.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.39.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.39.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.39.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.39.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.39.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.39.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.4.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.4.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.4.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.4.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.4.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.4.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.40.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.40.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.40.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.40.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.40.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.40.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.41.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.41.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.41.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.41.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.41.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.41.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.42.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.42.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.42.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.42.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.42.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.42.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.43.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.43.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.43.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.43.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.43.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.43.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.44.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.44.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.44.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.44.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.44.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.44.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.45.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.45.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.45.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.45.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.45.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.45.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.46.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.46.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.46.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.46.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.46.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.46.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.47.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.47.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.47.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.47.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.47.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.47.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.48.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.48.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.48.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.48.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.48.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.48.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.49.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.49.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.49.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.49.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.49.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.49.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.5.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.5.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.5.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.5.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.5.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.5.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.50.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.50.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.50.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.50.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.50.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.50.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.51.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.51.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.51.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.51.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.51.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.51.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.52.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.52.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.52.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.52.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.52.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.52.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.53.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.53.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.53.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.53.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.53.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.53.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.54.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.54.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.54.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.54.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.54.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.54.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.55.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.55.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.55.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.55.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.55.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.55.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.56.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.56.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.56.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.56.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.56.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.56.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.57.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.57.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.57.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.57.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.57.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.57.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.58.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.58.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.58.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.58.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.58.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.58.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.59.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.59.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.59.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.59.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.59.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.59.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.6.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.6.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.6.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.6.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.6.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.6.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.60.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.60.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.60.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.60.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.60.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.60.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.61.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.61.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.61.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.61.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.61.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.61.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.62.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.62.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.62.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.62.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.62.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.62.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.63.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.63.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.63.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.63.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.63.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.63.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.64.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.64.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.64.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.64.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.64.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.64.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.65.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.65.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.65.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.65.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.65.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.65.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.66.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.66.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.66.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.66.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.66.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.66.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.67.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.67.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.67.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.67.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.67.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.67.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.68.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.68.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.68.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.68.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.68.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.68.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.69.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.69.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.69.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.69.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.69.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.69.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.7.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.7.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.7.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.7.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.7.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.7.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.70.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.70.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.70.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.70.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.70.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.70.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.71.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.71.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.71.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.71.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.71.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.71.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.72.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.72.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.72.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.72.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.72.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.72.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.73.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.73.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.73.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.73.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.73.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.73.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.74.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.74.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.74.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.74.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.74.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.74.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.75.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.75.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.75.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.75.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.75.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.75.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.76.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.76.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.76.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.76.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.76.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.76.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.77.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.77.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.77.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.77.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.77.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.77.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.78.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.78.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.78.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.78.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.78.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.78.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.79.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.79.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.79.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.79.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.79.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.79.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.8.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.8.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.8.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.8.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.8.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.8.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.80.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.80.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.80.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.80.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.80.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.80.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.81.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.81.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.81.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.81.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.81.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.81.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.82.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.82.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.82.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.82.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.82.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.82.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.83.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.83.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.83.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.83.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.83.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.83.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.84.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.84.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.84.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.84.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.84.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.84.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.85.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.85.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.85.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.85.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.85.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.85.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.86.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.86.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.86.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.86.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.86.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.86.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.87.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.87.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.87.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.87.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.87.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.87.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.88.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.88.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.88.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.88.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.88.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.88.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.89.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.89.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.89.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.89.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.89.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.89.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.9.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.9.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.9.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.9.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.9.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.9.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.90.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.90.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.90.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.90.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.90.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.90.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.91.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.91.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.91.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.91.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.91.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.91.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.92.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.92.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.92.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.92.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.92.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.92.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.93.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.93.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.93.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.93.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.93.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.93.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.94.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.94.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.94.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.94.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.94.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.94.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.95.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.95.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.95.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.95.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.95.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.95.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.96.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.96.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.96.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.96.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.96.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.96.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.97.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.97.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.97.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.97.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.97.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.97.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.98.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.98.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.98.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.98.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.98.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.98.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.99.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.99.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.99.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.99.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.99.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.experts.99.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.gate.e_score_correction_bias": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.gate.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.shared_experts.down_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.shared_experts.down_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.shared_experts.gate_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.shared_experts.gate_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.shared_experts.up_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.mlp.shared_experts.up_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.post_attention_layernorm.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.self_attn.k_norm.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.self_attn.k_proj.bias": "model-00006-of-00092.safetensors",
+ "model.layers.5.self_attn.k_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.self_attn.k_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.self_attn.o_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.self_attn.o_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.self_attn.q_norm.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.self_attn.q_proj.bias": "model-00006-of-00092.safetensors",
+ "model.layers.5.self_attn.q_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.self_attn.q_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.5.self_attn.v_proj.bias": "model-00006-of-00092.safetensors",
+ "model.layers.5.self_attn.v_proj.weight": "model-00006-of-00092.safetensors",
+ "model.layers.5.self_attn.v_proj.weight_scale": "model-00006-of-00092.safetensors",
+ "model.layers.50.input_layernorm.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.0.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.0.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.0.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.0.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.0.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.0.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.1.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.1.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.1.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.1.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.1.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.1.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.10.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.10.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.10.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.10.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.10.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.10.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.100.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.100.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.100.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.100.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.100.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.100.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.101.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.101.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.101.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.101.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.101.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.101.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.102.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.102.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.102.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.102.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.102.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.102.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.103.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.103.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.103.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.103.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.103.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.103.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.104.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.104.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.104.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.104.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.104.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.104.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.105.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.105.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.105.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.105.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.105.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.105.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.106.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.106.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.106.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.106.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.106.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.106.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.107.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.107.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.107.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.107.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.107.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.107.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.108.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.108.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.108.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.108.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.108.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.108.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.109.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.109.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.109.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.109.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.109.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.109.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.11.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.11.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.11.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.11.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.11.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.11.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.110.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.110.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.110.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.110.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.110.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.110.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.111.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.111.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.111.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.111.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.111.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.111.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.112.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.112.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.112.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.112.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.112.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.112.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.113.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.113.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.113.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.113.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.113.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.113.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.114.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.114.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.114.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.114.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.114.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.114.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.115.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.115.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.115.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.115.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.115.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.115.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.116.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.116.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.116.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.116.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.116.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.116.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.117.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.117.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.117.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.117.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.117.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.117.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.118.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.118.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.118.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.118.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.118.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.118.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.119.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.119.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.119.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.119.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.119.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.119.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.12.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.12.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.12.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.12.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.12.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.12.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.120.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.120.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.120.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.120.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.120.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.120.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.121.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.121.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.121.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.121.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.121.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.121.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.122.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.122.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.122.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.122.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.122.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.122.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.123.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.123.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.123.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.123.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.123.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.123.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.124.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.124.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.124.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.124.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.124.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.124.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.125.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.125.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.125.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.125.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.125.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.125.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.126.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.126.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.126.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.126.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.126.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.126.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.127.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.127.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.127.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.127.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.127.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.127.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.128.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.128.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.128.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.128.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.128.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.128.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.129.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.129.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.129.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.129.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.129.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.129.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.13.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.13.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.13.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.13.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.13.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.13.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.130.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.130.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.130.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.130.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.130.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.130.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.131.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.131.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.131.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.131.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.131.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.131.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.132.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.132.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.132.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.132.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.132.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.132.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.133.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.133.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.133.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.133.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.133.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.133.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.134.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.134.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.134.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.134.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.134.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.134.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.135.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.135.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.135.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.135.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.135.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.135.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.136.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.136.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.136.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.136.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.136.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.136.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.137.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.137.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.137.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.137.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.137.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.137.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.138.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.138.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.138.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.138.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.138.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.138.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.139.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.139.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.139.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.139.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.139.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.139.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.14.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.14.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.14.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.14.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.14.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.14.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.140.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.140.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.140.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.140.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.140.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.140.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.141.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.141.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.141.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.141.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.141.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.141.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.142.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.142.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.142.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.142.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.142.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.142.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.143.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.143.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.143.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.143.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.143.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.143.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.144.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.144.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.144.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.144.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.144.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.144.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.145.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.145.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.145.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.145.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.145.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.145.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.146.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.146.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.146.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.146.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.146.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.146.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.147.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.147.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.147.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.147.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.147.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.147.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.148.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.148.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.148.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.148.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.148.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.148.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.149.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.149.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.149.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.149.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.149.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.149.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.15.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.15.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.15.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.15.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.15.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.15.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.150.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.150.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.150.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.150.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.150.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.150.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.151.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.151.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.151.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.151.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.151.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.151.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.152.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.152.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.152.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.152.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.152.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.152.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.153.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.153.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.153.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.153.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.153.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.153.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.154.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.154.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.154.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.154.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.154.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.154.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.155.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.155.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.155.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.155.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.155.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.155.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.156.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.156.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.156.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.156.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.156.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.156.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.157.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.157.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.157.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.157.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.157.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.157.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.158.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.158.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.158.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.158.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.158.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.158.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.159.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.159.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.159.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.159.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.159.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.159.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.16.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.16.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.16.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.16.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.16.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.16.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.17.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.17.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.17.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.17.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.17.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.17.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.18.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.18.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.18.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.18.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.18.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.18.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.19.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.19.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.19.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.19.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.19.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.19.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.2.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.2.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.2.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.2.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.2.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.2.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.20.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.20.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.20.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.20.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.20.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.20.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.21.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.21.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.21.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.21.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.21.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.21.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.22.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.22.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.22.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.22.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.22.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.22.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.23.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.23.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.23.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.23.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.23.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.23.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.24.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.24.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.24.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.24.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.24.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.24.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.25.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.25.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.25.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.25.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.25.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.25.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.26.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.26.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.26.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.26.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.26.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.26.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.27.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.27.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.27.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.27.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.27.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.27.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.28.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.28.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.28.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.28.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.28.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.28.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.29.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.29.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.29.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.29.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.29.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.29.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.3.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.3.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.3.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.3.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.3.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.3.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.30.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.30.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.30.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.30.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.30.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.30.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.31.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.31.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.31.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.31.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.31.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.31.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.32.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.32.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.32.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.32.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.32.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.32.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.33.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.33.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.33.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.33.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.33.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.33.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.34.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.34.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.34.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.34.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.34.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.34.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.35.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.35.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.35.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.35.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.35.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.35.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.36.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.36.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.36.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.36.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.36.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.36.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.37.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.37.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.37.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.37.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.37.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.37.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.38.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.38.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.38.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.38.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.38.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.38.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.39.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.39.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.39.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.39.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.39.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.39.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.4.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.4.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.4.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.4.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.4.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.4.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.40.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.40.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.40.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.40.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.40.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.40.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.41.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.41.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.41.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.41.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.41.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.41.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.42.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.42.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.42.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.42.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.42.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.42.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.43.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.43.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.43.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.43.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.43.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.43.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.44.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.44.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.44.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.44.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.44.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.44.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.45.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.45.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.45.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.45.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.45.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.45.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.46.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.46.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.46.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.46.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.46.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.46.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.47.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.47.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.47.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.47.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.47.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.47.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.48.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.48.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.48.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.48.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.48.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.48.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.49.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.49.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.49.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.49.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.49.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.49.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.5.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.5.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.5.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.5.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.5.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.5.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.50.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.50.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.50.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.50.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.50.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.50.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.51.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.51.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.51.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.51.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.51.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.51.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.52.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.52.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.52.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.52.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.52.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.52.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.53.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.53.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.53.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.53.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.53.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.53.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.54.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.54.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.54.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.54.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.54.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.54.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.55.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.55.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.55.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.55.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.55.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.55.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.56.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.56.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.56.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.56.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.56.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.56.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.57.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.57.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.57.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.57.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.57.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.57.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.58.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.58.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.58.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.58.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.58.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.58.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.59.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.59.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.59.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.59.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.59.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.59.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.6.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.6.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.6.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.6.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.6.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.6.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.60.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.60.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.60.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.60.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.60.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.60.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.61.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.61.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.61.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.61.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.61.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.61.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.62.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.62.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.62.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.62.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.62.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.62.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.63.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.63.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.63.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.63.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.63.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.63.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.64.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.64.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.64.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.64.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.64.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.64.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.65.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.65.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.65.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.65.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.65.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.65.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.66.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.66.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.66.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.66.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.66.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.66.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.67.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.67.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.67.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.67.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.67.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.67.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.68.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.68.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.68.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.68.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.68.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.68.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.69.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.69.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.69.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.69.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.69.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.69.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.7.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.7.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.7.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.7.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.7.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.7.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.70.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.70.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.70.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.70.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.70.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.70.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.71.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.71.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.71.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.71.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.71.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.71.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.72.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.72.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.72.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.72.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.72.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.72.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.73.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.73.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.73.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.73.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.73.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.73.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.74.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.74.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.74.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.74.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.74.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.74.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.75.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.75.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.75.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.75.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.75.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.75.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.76.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.76.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.76.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.76.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.76.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.76.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.77.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.77.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.77.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.77.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.77.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.77.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.78.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.78.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.78.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.78.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.78.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.78.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.79.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.79.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.79.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.79.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.79.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.79.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.8.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.8.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.8.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.8.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.8.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.8.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.80.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.80.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.80.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.80.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.80.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.80.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.81.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.81.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.81.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.81.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.81.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.81.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.82.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.82.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.82.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.82.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.82.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.82.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.83.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.83.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.83.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.83.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.83.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.83.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.84.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.84.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.84.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.84.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.84.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.84.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.85.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.85.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.85.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.85.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.85.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.85.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.86.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.86.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.86.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.86.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.86.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.86.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.87.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.87.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.87.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.87.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.87.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.87.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.88.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.88.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.88.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.88.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.88.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.88.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.89.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.89.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.89.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.89.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.89.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.89.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.9.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.9.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.9.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.9.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.9.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.9.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.90.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.90.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.90.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.90.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.90.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.90.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.91.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.91.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.91.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.91.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.91.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.91.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.92.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.92.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.92.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.92.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.92.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.92.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.93.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.93.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.93.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.93.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.93.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.93.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.94.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.94.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.94.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.94.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.94.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.94.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.95.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.95.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.95.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.95.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.95.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.95.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.96.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.96.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.96.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.96.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.96.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.96.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.97.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.97.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.97.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.97.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.97.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.97.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.98.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.98.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.98.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.98.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.98.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.98.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.99.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.99.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.99.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.99.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.99.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.experts.99.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.gate.e_score_correction_bias": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.gate.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.shared_experts.down_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.shared_experts.down_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.shared_experts.gate_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.shared_experts.gate_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.shared_experts.up_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.mlp.shared_experts.up_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.post_attention_layernorm.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.self_attn.k_norm.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.self_attn.k_proj.bias": "model-00051-of-00092.safetensors",
+ "model.layers.50.self_attn.k_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.self_attn.k_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.self_attn.o_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.self_attn.o_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.self_attn.q_norm.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.self_attn.q_proj.bias": "model-00051-of-00092.safetensors",
+ "model.layers.50.self_attn.q_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.self_attn.q_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.50.self_attn.v_proj.bias": "model-00051-of-00092.safetensors",
+ "model.layers.50.self_attn.v_proj.weight": "model-00051-of-00092.safetensors",
+ "model.layers.50.self_attn.v_proj.weight_scale": "model-00051-of-00092.safetensors",
+ "model.layers.51.input_layernorm.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.0.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.0.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.0.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.0.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.0.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.0.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.1.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.1.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.1.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.1.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.1.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.1.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.10.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.10.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.10.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.10.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.10.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.10.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.100.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.100.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.100.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.100.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.100.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.100.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.101.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.101.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.101.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.101.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.101.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.101.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.102.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.102.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.102.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.102.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.102.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.102.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.103.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.103.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.103.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.103.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.103.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.103.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.104.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.104.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.104.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.104.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.104.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.104.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.105.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.105.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.105.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.105.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.105.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.105.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.106.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.106.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.106.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.106.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.106.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.106.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.107.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.107.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.107.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.107.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.107.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.107.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.108.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.108.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.108.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.108.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.108.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.108.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.109.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.109.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.109.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.109.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.109.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.109.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.11.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.11.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.11.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.11.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.11.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.11.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.110.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.110.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.110.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.110.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.110.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.110.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.111.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.111.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.111.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.111.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.111.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.111.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.112.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.112.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.112.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.112.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.112.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.112.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.113.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.113.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.113.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.113.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.113.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.113.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.114.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.114.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.114.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.114.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.114.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.114.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.115.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.115.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.115.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.115.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.115.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.115.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.116.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.116.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.116.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.116.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.116.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.116.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.117.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.117.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.117.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.117.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.117.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.117.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.118.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.118.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.118.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.118.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.118.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.118.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.119.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.119.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.119.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.119.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.119.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.119.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.12.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.12.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.12.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.12.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.12.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.12.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.120.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.120.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.120.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.120.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.120.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.120.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.121.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.121.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.121.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.121.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.121.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.121.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.122.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.122.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.122.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.122.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.122.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.122.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.123.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.123.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.123.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.123.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.123.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.123.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.124.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.124.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.124.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.124.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.124.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.124.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.125.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.125.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.125.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.125.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.125.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.125.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.126.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.126.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.126.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.126.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.126.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.126.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.127.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.127.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.127.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.127.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.127.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.127.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.128.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.128.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.128.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.128.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.128.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.128.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.129.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.129.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.129.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.129.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.129.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.129.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.13.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.13.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.13.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.13.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.13.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.13.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.130.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.130.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.130.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.130.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.130.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.130.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.131.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.131.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.131.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.131.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.131.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.131.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.132.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.132.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.132.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.132.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.132.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.132.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.133.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.133.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.133.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.133.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.133.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.133.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.134.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.134.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.134.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.134.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.134.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.134.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.135.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.135.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.135.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.135.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.135.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.135.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.136.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.136.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.136.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.136.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.136.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.136.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.137.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.137.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.137.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.137.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.137.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.137.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.138.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.138.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.138.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.138.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.138.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.138.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.139.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.139.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.139.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.139.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.139.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.139.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.14.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.14.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.14.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.14.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.14.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.14.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.140.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.140.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.140.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.140.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.140.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.140.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.141.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.141.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.141.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.141.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.141.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.141.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.142.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.142.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.142.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.142.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.142.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.142.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.143.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.143.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.143.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.143.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.143.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.143.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.144.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.144.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.144.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.144.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.144.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.144.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.145.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.145.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.145.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.145.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.145.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.145.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.146.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.146.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.146.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.146.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.146.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.146.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.147.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.147.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.147.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.147.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.147.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.147.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.148.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.148.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.148.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.148.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.148.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.148.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.149.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.149.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.149.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.149.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.149.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.149.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.15.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.15.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.15.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.15.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.15.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.15.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.150.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.150.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.150.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.150.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.150.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.150.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.151.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.151.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.151.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.151.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.151.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.151.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.152.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.152.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.152.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.152.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.152.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.152.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.153.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.153.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.153.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.153.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.153.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.153.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.154.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.154.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.154.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.154.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.154.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.154.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.155.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.155.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.155.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.155.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.155.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.155.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.156.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.156.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.156.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.156.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.156.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.156.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.157.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.157.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.157.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.157.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.157.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.157.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.158.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.158.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.158.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.158.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.158.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.158.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.159.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.159.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.159.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.159.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.159.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.159.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.16.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.16.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.16.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.16.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.16.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.16.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.17.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.17.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.17.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.17.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.17.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.17.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.18.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.18.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.18.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.18.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.18.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.18.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.19.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.19.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.19.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.19.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.19.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.19.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.2.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.2.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.2.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.2.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.2.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.2.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.20.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.20.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.20.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.20.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.20.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.20.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.21.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.21.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.21.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.21.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.21.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.21.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.22.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.22.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.22.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.22.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.22.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.22.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.23.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.23.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.23.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.23.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.23.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.23.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.24.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.24.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.24.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.24.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.24.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.24.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.25.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.25.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.25.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.25.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.25.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.25.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.26.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.26.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.26.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.26.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.26.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.26.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.27.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.27.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.27.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.27.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.27.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.27.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.28.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.28.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.28.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.28.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.28.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.28.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.29.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.29.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.29.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.29.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.29.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.29.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.3.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.3.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.3.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.3.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.3.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.3.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.30.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.30.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.30.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.30.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.30.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.30.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.31.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.31.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.31.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.31.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.31.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.31.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.32.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.32.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.32.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.32.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.32.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.32.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.33.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.33.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.33.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.33.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.33.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.33.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.34.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.34.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.34.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.34.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.34.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.34.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.35.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.35.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.35.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.35.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.35.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.35.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.36.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.36.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.36.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.36.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.36.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.36.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.37.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.37.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.37.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.37.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.37.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.37.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.38.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.38.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.38.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.38.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.38.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.38.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.39.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.39.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.39.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.39.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.39.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.39.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.4.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.4.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.4.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.4.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.4.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.4.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.40.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.40.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.40.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.40.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.40.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.40.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.41.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.41.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.41.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.41.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.41.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.41.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.42.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.42.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.42.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.42.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.42.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.42.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.43.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.43.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.43.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.43.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.43.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.43.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.44.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.44.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.44.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.44.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.44.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.44.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.45.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.45.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.45.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.45.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.45.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.45.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.46.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.46.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.46.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.46.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.46.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.46.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.47.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.47.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.47.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.47.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.47.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.47.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.48.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.48.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.48.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.48.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.48.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.48.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.49.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.49.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.49.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.49.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.49.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.49.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.5.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.5.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.5.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.5.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.5.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.5.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.50.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.50.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.50.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.50.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.50.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.50.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.51.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.51.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.51.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.51.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.51.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.51.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.52.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.52.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.52.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.52.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.52.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.52.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.53.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.53.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.53.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.53.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.53.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.53.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.54.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.54.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.54.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.54.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.54.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.54.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.55.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.55.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.55.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.55.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.55.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.55.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.56.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.56.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.56.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.56.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.56.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.56.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.57.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.57.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.57.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.57.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.57.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.57.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.58.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.58.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.58.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.58.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.58.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.58.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.59.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.59.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.59.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.59.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.59.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.59.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.6.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.6.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.6.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.6.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.6.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.6.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.60.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.60.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.60.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.60.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.60.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.60.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.61.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.61.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.61.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.61.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.61.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.61.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.62.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.62.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.62.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.62.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.62.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.62.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.63.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.63.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.63.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.63.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.63.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.63.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.64.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.64.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.64.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.64.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.64.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.64.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.65.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.65.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.65.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.65.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.65.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.65.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.66.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.66.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.66.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.66.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.66.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.66.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.67.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.67.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.67.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.67.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.67.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.67.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.68.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.68.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.68.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.68.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.68.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.68.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.69.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.69.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.69.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.69.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.69.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.69.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.7.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.7.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.7.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.7.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.7.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.7.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.70.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.70.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.70.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.70.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.70.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.70.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.71.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.71.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.71.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.71.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.71.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.71.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.72.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.72.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.72.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.72.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.72.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.72.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.73.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.73.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.73.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.73.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.73.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.73.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.74.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.74.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.74.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.74.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.74.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.74.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.75.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.75.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.75.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.75.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.75.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.75.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.76.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.76.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.76.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.76.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.76.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.76.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.77.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.77.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.77.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.77.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.77.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.77.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.78.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.78.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.78.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.78.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.78.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.78.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.79.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.79.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.79.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.79.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.79.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.79.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.8.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.8.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.8.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.8.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.8.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.8.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.80.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.80.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.80.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.80.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.80.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.80.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.81.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.81.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.81.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.81.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.81.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.81.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.82.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.82.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.82.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.82.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.82.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.82.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.83.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.83.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.83.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.83.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.83.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.83.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.84.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.84.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.84.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.84.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.84.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.84.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.85.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.85.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.85.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.85.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.85.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.85.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.86.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.86.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.86.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.86.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.86.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.86.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.87.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.87.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.87.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.87.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.87.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.87.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.88.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.88.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.88.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.88.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.88.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.88.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.89.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.89.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.89.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.89.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.89.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.89.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.9.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.9.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.9.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.9.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.9.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.9.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.90.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.90.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.90.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.90.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.90.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.90.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.91.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.91.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.91.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.91.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.91.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.91.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.92.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.92.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.92.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.92.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.92.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.92.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.93.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.93.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.93.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.93.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.93.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.93.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.94.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.94.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.94.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.94.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.94.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.94.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.95.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.95.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.95.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.95.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.95.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.95.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.96.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.96.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.96.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.96.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.96.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.96.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.97.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.97.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.97.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.97.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.97.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.97.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.98.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.98.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.98.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.98.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.98.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.98.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.99.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.99.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.99.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.99.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.99.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.experts.99.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.gate.e_score_correction_bias": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.gate.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.shared_experts.down_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.shared_experts.down_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.shared_experts.gate_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.shared_experts.gate_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.shared_experts.up_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.mlp.shared_experts.up_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.post_attention_layernorm.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.self_attn.k_norm.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.self_attn.k_proj.bias": "model-00052-of-00092.safetensors",
+ "model.layers.51.self_attn.k_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.self_attn.k_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.self_attn.o_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.self_attn.o_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.self_attn.q_norm.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.self_attn.q_proj.bias": "model-00052-of-00092.safetensors",
+ "model.layers.51.self_attn.q_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.self_attn.q_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.51.self_attn.v_proj.bias": "model-00052-of-00092.safetensors",
+ "model.layers.51.self_attn.v_proj.weight": "model-00052-of-00092.safetensors",
+ "model.layers.51.self_attn.v_proj.weight_scale": "model-00052-of-00092.safetensors",
+ "model.layers.52.input_layernorm.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.0.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.0.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.0.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.0.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.0.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.0.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.1.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.1.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.1.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.1.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.1.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.1.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.10.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.10.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.10.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.10.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.10.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.10.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.100.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.100.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.100.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.100.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.100.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.100.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.101.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.101.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.101.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.101.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.101.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.101.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.102.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.102.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.102.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.102.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.102.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.102.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.103.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.103.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.103.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.103.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.103.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.103.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.104.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.104.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.104.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.104.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.104.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.104.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.105.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.105.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.105.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.105.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.105.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.105.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.106.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.106.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.106.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.106.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.106.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.106.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.107.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.107.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.107.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.107.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.107.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.107.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.108.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.108.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.108.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.108.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.108.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.108.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.109.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.109.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.109.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.109.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.109.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.109.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.11.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.11.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.11.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.11.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.11.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.11.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.110.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.110.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.110.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.110.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.110.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.110.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.111.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.111.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.111.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.111.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.111.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.111.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.112.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.112.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.112.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.112.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.112.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.112.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.113.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.113.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.113.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.113.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.113.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.113.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.114.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.114.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.114.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.114.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.114.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.114.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.115.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.115.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.115.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.115.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.115.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.115.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.116.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.116.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.116.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.116.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.116.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.116.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.117.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.117.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.117.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.117.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.117.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.117.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.118.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.118.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.118.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.118.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.118.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.118.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.119.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.119.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.119.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.119.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.119.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.119.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.12.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.12.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.12.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.12.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.12.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.12.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.120.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.120.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.120.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.120.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.120.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.120.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.121.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.121.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.121.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.121.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.121.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.121.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.122.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.122.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.122.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.122.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.122.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.122.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.123.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.123.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.123.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.123.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.123.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.123.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.124.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.124.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.124.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.124.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.124.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.124.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.125.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.125.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.125.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.125.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.125.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.125.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.126.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.126.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.126.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.126.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.126.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.126.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.127.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.127.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.127.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.127.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.127.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.127.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.128.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.128.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.128.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.128.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.128.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.128.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.129.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.129.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.129.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.129.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.129.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.129.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.13.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.13.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.13.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.13.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.13.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.13.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.130.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.130.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.130.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.130.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.130.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.130.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.131.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.131.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.131.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.131.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.131.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.131.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.132.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.132.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.132.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.132.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.132.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.132.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.133.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.133.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.133.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.133.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.133.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.133.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.134.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.134.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.134.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.134.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.134.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.134.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.135.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.135.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.135.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.135.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.135.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.135.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.136.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.136.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.136.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.136.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.136.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.136.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.137.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.137.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.137.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.137.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.137.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.137.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.138.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.138.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.138.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.138.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.138.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.138.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.139.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.139.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.139.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.139.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.139.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.139.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.14.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.14.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.14.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.14.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.14.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.14.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.140.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.140.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.140.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.140.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.140.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.140.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.141.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.141.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.141.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.141.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.141.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.141.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.142.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.142.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.142.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.142.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.142.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.142.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.143.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.143.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.143.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.143.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.143.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.143.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.144.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.144.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.144.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.144.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.144.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.144.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.145.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.145.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.145.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.145.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.145.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.145.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.146.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.146.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.146.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.146.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.146.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.146.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.147.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.147.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.147.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.147.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.147.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.147.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.148.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.148.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.148.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.148.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.148.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.148.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.149.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.149.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.149.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.149.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.149.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.149.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.15.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.15.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.15.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.15.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.15.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.15.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.150.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.150.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.150.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.150.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.150.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.150.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.151.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.151.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.151.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.151.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.151.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.151.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.152.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.152.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.152.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.152.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.152.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.152.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.153.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.153.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.153.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.153.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.153.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.153.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.154.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.154.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.154.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.154.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.154.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.154.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.155.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.155.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.155.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.155.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.155.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.155.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.156.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.156.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.156.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.156.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.156.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.156.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.157.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.157.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.157.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.157.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.157.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.157.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.158.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.158.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.158.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.158.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.158.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.158.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.159.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.159.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.159.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.159.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.159.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.159.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.16.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.16.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.16.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.16.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.16.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.16.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.17.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.17.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.17.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.17.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.17.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.17.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.18.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.18.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.18.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.18.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.18.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.18.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.19.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.19.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.19.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.19.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.19.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.19.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.2.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.2.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.2.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.2.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.2.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.2.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.20.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.20.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.20.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.20.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.20.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.20.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.21.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.21.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.21.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.21.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.21.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.21.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.22.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.22.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.22.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.22.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.22.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.22.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.23.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.23.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.23.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.23.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.23.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.23.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.24.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.24.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.24.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.24.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.24.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.24.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.25.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.25.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.25.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.25.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.25.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.25.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.26.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.26.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.26.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.26.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.26.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.26.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.27.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.27.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.27.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.27.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.27.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.27.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.28.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.28.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.28.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.28.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.28.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.28.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.29.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.29.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.29.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.29.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.29.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.29.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.3.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.3.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.3.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.3.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.3.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.3.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.30.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.30.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.30.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.30.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.30.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.30.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.31.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.31.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.31.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.31.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.31.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.31.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.32.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.32.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.32.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.32.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.32.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.32.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.33.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.33.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.33.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.33.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.33.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.33.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.34.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.34.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.34.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.34.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.34.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.34.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.35.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.35.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.35.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.35.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.35.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.35.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.36.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.36.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.36.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.36.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.36.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.36.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.37.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.37.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.37.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.37.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.37.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.37.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.38.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.38.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.38.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.38.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.38.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.38.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.39.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.39.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.39.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.39.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.39.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.39.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.4.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.4.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.4.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.4.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.4.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.4.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.40.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.40.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.40.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.40.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.40.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.40.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.41.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.41.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.41.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.41.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.41.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.41.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.42.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.42.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.42.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.42.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.42.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.42.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.43.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.43.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.43.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.43.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.43.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.43.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.44.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.44.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.44.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.44.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.44.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.44.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.45.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.45.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.45.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.45.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.45.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.45.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.46.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.46.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.46.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.46.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.46.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.46.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.47.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.47.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.47.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.47.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.47.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.47.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.48.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.48.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.48.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.48.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.48.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.48.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.49.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.49.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.49.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.49.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.49.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.49.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.5.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.5.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.5.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.5.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.5.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.5.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.50.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.50.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.50.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.50.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.50.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.50.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.51.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.51.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.51.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.51.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.51.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.51.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.52.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.52.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.52.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.52.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.52.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.52.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.53.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.53.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.53.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.53.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.53.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.53.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.54.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.54.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.54.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.54.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.54.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.54.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.55.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.55.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.55.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.55.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.55.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.55.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.56.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.56.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.56.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.56.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.56.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.56.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.57.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.57.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.57.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.57.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.57.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.57.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.58.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.58.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.58.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.58.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.58.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.58.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.59.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.59.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.59.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.59.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.59.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.59.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.6.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.6.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.6.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.6.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.6.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.6.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.60.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.60.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.60.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.60.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.60.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.60.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.61.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.61.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.61.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.61.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.61.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.61.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.62.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.62.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.62.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.62.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.62.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.62.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.63.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.63.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.63.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.63.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.63.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.63.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.64.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.64.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.64.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.64.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.64.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.64.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.65.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.65.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.65.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.65.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.65.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.65.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.66.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.66.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.66.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.66.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.66.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.66.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.67.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.67.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.67.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.67.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.67.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.67.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.68.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.68.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.68.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.68.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.68.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.68.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.69.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.69.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.69.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.69.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.69.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.69.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.7.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.7.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.7.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.7.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.7.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.7.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.70.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.70.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.70.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.70.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.70.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.70.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.71.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.71.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.71.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.71.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.71.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.71.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.72.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.72.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.72.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.72.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.72.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.72.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.73.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.73.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.73.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.73.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.73.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.73.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.74.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.74.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.74.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.74.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.74.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.74.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.75.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.75.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.75.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.75.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.75.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.75.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.76.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.76.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.76.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.76.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.76.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.76.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.77.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.77.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.77.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.77.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.77.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.77.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.78.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.78.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.78.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.78.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.78.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.78.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.79.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.79.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.79.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.79.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.79.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.79.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.8.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.8.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.8.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.8.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.8.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.8.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.80.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.80.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.80.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.80.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.80.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.80.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.81.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.81.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.81.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.81.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.81.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.81.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.82.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.82.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.82.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.82.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.82.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.82.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.83.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.83.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.83.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.83.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.83.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.83.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.84.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.84.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.84.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.84.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.84.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.84.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.85.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.85.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.85.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.85.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.85.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.85.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.86.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.86.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.86.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.86.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.86.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.86.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.87.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.87.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.87.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.87.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.87.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.87.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.88.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.88.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.88.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.88.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.88.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.88.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.89.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.89.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.89.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.89.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.89.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.89.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.9.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.9.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.9.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.9.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.9.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.9.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.90.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.90.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.90.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.90.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.90.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.90.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.91.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.91.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.91.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.91.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.91.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.91.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.92.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.92.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.92.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.92.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.92.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.92.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.93.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.93.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.93.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.93.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.93.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.93.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.94.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.94.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.94.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.94.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.94.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.94.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.95.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.95.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.95.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.95.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.95.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.95.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.96.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.96.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.96.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.96.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.96.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.96.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.97.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.97.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.97.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.97.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.97.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.97.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.98.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.98.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.98.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.98.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.98.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.98.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.99.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.99.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.99.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.99.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.99.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.experts.99.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.gate.e_score_correction_bias": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.gate.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.shared_experts.down_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.shared_experts.down_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.shared_experts.gate_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.shared_experts.gate_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.shared_experts.up_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.mlp.shared_experts.up_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.post_attention_layernorm.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.self_attn.k_norm.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.self_attn.k_proj.bias": "model-00053-of-00092.safetensors",
+ "model.layers.52.self_attn.k_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.self_attn.k_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.self_attn.o_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.self_attn.o_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.self_attn.q_norm.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.self_attn.q_proj.bias": "model-00053-of-00092.safetensors",
+ "model.layers.52.self_attn.q_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.self_attn.q_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.52.self_attn.v_proj.bias": "model-00053-of-00092.safetensors",
+ "model.layers.52.self_attn.v_proj.weight": "model-00053-of-00092.safetensors",
+ "model.layers.52.self_attn.v_proj.weight_scale": "model-00053-of-00092.safetensors",
+ "model.layers.53.input_layernorm.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.0.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.0.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.0.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.0.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.0.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.0.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.1.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.1.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.1.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.1.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.1.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.1.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.10.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.10.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.10.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.10.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.10.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.10.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.100.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.100.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.100.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.100.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.100.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.100.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.101.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.101.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.101.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.101.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.101.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.101.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.102.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.102.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.102.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.102.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.102.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.102.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.103.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.103.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.103.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.103.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.103.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.103.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.104.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.104.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.104.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.104.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.104.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.104.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.105.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.105.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.105.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.105.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.105.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.105.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.106.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.106.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.106.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.106.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.106.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.106.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.107.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.107.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.107.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.107.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.107.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.107.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.108.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.108.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.108.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.108.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.108.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.108.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.109.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.109.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.109.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.109.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.109.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.109.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.11.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.11.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.11.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.11.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.11.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.11.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.110.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.110.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.110.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.110.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.110.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.110.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.111.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.111.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.111.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.111.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.111.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.111.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.112.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.112.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.112.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.112.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.112.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.112.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.113.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.113.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.113.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.113.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.113.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.113.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.114.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.114.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.114.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.114.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.114.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.114.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.115.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.115.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.115.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.115.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.115.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.115.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.116.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.116.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.116.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.116.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.116.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.116.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.117.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.117.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.117.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.117.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.117.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.117.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.118.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.118.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.118.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.118.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.118.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.118.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.119.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.119.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.119.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.119.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.119.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.119.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.12.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.12.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.12.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.12.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.12.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.12.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.120.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.120.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.120.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.120.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.120.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.120.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.121.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.121.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.121.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.121.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.121.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.121.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.122.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.122.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.122.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.122.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.122.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.122.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.123.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.123.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.123.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.123.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.123.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.123.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.124.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.124.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.124.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.124.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.124.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.124.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.125.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.125.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.125.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.125.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.125.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.125.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.126.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.126.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.126.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.126.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.126.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.126.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.127.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.127.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.127.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.127.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.127.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.127.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.128.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.128.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.128.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.128.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.128.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.128.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.129.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.129.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.129.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.129.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.129.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.129.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.13.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.13.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.13.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.13.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.13.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.13.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.130.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.130.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.130.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.130.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.130.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.130.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.131.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.131.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.131.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.131.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.131.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.131.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.132.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.132.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.132.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.132.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.132.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.132.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.133.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.133.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.133.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.133.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.133.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.133.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.134.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.134.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.134.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.134.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.134.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.134.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.135.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.135.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.135.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.135.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.135.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.135.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.136.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.136.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.136.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.136.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.136.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.136.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.137.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.137.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.137.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.137.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.137.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.137.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.138.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.138.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.138.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.138.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.138.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.138.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.139.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.139.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.139.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.139.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.139.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.139.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.14.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.14.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.14.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.14.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.14.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.14.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.140.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.140.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.140.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.140.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.140.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.140.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.141.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.141.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.141.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.141.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.141.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.141.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.142.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.142.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.142.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.142.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.142.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.142.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.143.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.143.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.143.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.143.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.143.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.143.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.144.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.144.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.144.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.144.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.144.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.144.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.145.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.145.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.145.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.145.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.145.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.145.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.146.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.146.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.146.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.146.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.146.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.146.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.147.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.147.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.147.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.147.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.147.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.147.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.148.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.148.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.148.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.148.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.148.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.148.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.149.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.149.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.149.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.149.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.149.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.149.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.15.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.15.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.15.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.15.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.15.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.15.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.150.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.150.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.150.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.150.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.150.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.150.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.151.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.151.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.151.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.151.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.151.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.151.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.152.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.152.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.152.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.152.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.152.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.152.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.153.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.153.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.153.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.153.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.153.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.153.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.154.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.154.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.154.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.154.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.154.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.154.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.155.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.155.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.155.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.155.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.155.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.155.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.156.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.156.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.156.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.156.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.156.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.156.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.157.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.157.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.157.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.157.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.157.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.157.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.158.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.158.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.158.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.158.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.158.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.158.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.159.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.159.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.159.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.159.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.159.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.159.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.16.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.16.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.16.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.16.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.16.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.16.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.17.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.17.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.17.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.17.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.17.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.17.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.18.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.18.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.18.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.18.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.18.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.18.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.19.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.19.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.19.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.19.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.19.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.19.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.2.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.2.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.2.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.2.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.2.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.2.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.20.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.20.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.20.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.20.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.20.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.20.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.21.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.21.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.21.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.21.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.21.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.21.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.22.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.22.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.22.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.22.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.22.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.22.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.23.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.23.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.23.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.23.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.23.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.23.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.24.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.24.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.24.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.24.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.24.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.24.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.25.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.25.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.25.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.25.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.25.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.25.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.26.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.26.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.26.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.26.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.26.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.26.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.27.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.27.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.27.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.27.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.27.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.27.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.28.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.28.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.28.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.28.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.28.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.28.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.29.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.29.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.29.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.29.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.29.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.29.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.3.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.3.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.3.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.3.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.3.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.3.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.30.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.30.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.30.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.30.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.30.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.30.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.31.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.31.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.31.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.31.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.31.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.31.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.32.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.32.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.32.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.32.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.32.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.32.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.33.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.33.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.33.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.33.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.33.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.33.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.34.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.34.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.34.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.34.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.34.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.34.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.35.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.35.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.35.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.35.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.35.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.35.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.36.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.36.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.36.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.36.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.36.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.36.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.37.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.37.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.37.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.37.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.37.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.37.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.38.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.38.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.38.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.38.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.38.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.38.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.39.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.39.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.39.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.39.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.39.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.39.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.4.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.4.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.4.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.4.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.4.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.4.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.40.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.40.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.40.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.40.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.40.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.40.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.41.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.41.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.41.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.41.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.41.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.41.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.42.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.42.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.42.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.42.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.42.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.42.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.43.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.43.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.43.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.43.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.43.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.43.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.44.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.44.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.44.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.44.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.44.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.44.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.45.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.45.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.45.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.45.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.45.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.45.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.46.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.46.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.46.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.46.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.46.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.46.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.47.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.47.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.47.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.47.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.47.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.47.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.48.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.48.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.48.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.48.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.48.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.48.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.49.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.49.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.49.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.49.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.49.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.49.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.5.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.5.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.5.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.5.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.5.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.5.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.50.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.50.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.50.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.50.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.50.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.50.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.51.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.51.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.51.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.51.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.51.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.51.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.52.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.52.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.52.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.52.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.52.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.52.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.53.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.53.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.53.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.53.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.53.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.53.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.54.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.54.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.54.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.54.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.54.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.54.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.55.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.55.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.55.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.55.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.55.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.55.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.56.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.56.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.56.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.56.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.56.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.56.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.57.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.57.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.57.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.57.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.57.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.57.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.58.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.58.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.58.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.58.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.58.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.58.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.59.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.59.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.59.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.59.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.59.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.59.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.6.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.6.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.6.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.6.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.6.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.6.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.60.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.60.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.60.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.60.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.60.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.60.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.61.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.61.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.61.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.61.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.61.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.61.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.62.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.62.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.62.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.62.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.62.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.62.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.63.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.63.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.63.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.63.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.63.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.63.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.64.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.64.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.64.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.64.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.64.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.64.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.65.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.65.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.65.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.65.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.65.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.65.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.66.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.66.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.66.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.66.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.66.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.66.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.67.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.67.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.67.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.67.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.67.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.67.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.68.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.68.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.68.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.68.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.68.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.68.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.69.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.69.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.69.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.69.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.69.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.69.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.7.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.7.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.7.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.7.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.7.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.7.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.70.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.70.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.70.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.70.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.70.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.70.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.71.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.71.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.71.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.71.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.71.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.71.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.72.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.72.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.72.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.72.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.72.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.72.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.73.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.73.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.73.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.73.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.73.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.73.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.74.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.74.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.74.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.74.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.74.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.74.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.75.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.75.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.75.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.75.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.75.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.75.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.76.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.76.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.76.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.76.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.76.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.76.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.77.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.77.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.77.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.77.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.77.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.77.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.78.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.78.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.78.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.78.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.78.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.78.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.79.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.79.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.79.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.79.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.79.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.79.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.8.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.8.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.8.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.8.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.8.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.8.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.80.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.80.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.80.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.80.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.80.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.80.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.81.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.81.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.81.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.81.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.81.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.81.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.82.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.82.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.82.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.82.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.82.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.82.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.83.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.83.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.83.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.83.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.83.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.83.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.84.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.84.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.84.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.84.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.84.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.84.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.85.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.85.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.85.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.85.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.85.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.85.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.86.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.86.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.86.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.86.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.86.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.86.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.87.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.87.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.87.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.87.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.87.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.87.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.88.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.88.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.88.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.88.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.88.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.88.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.89.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.89.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.89.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.89.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.89.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.89.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.9.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.9.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.9.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.9.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.9.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.9.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.90.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.90.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.90.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.90.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.90.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.90.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.91.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.91.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.91.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.91.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.91.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.91.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.92.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.92.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.92.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.92.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.92.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.92.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.93.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.93.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.93.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.93.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.93.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.93.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.94.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.94.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.94.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.94.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.94.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.94.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.95.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.95.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.95.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.95.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.95.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.95.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.96.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.96.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.96.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.96.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.96.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.96.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.97.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.97.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.97.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.97.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.97.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.97.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.98.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.98.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.98.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.98.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.98.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.98.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.99.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.99.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.99.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.99.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.99.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.experts.99.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.gate.e_score_correction_bias": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.gate.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.shared_experts.down_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.shared_experts.down_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.shared_experts.gate_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.shared_experts.gate_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.shared_experts.up_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.mlp.shared_experts.up_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.post_attention_layernorm.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.self_attn.k_norm.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.self_attn.k_proj.bias": "model-00054-of-00092.safetensors",
+ "model.layers.53.self_attn.k_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.self_attn.k_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.self_attn.o_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.self_attn.o_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.self_attn.q_norm.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.self_attn.q_proj.bias": "model-00054-of-00092.safetensors",
+ "model.layers.53.self_attn.q_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.self_attn.q_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.53.self_attn.v_proj.bias": "model-00054-of-00092.safetensors",
+ "model.layers.53.self_attn.v_proj.weight": "model-00054-of-00092.safetensors",
+ "model.layers.53.self_attn.v_proj.weight_scale": "model-00054-of-00092.safetensors",
+ "model.layers.54.input_layernorm.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.0.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.0.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.0.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.0.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.0.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.0.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.1.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.1.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.1.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.1.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.1.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.1.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.10.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.10.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.10.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.10.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.10.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.10.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.100.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.100.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.100.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.100.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.100.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.100.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.101.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.101.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.101.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.101.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.101.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.101.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.102.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.102.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.102.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.102.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.102.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.102.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.103.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.103.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.103.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.103.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.103.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.103.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.104.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.104.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.104.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.104.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.104.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.104.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.105.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.105.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.105.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.105.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.105.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.105.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.106.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.106.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.106.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.106.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.106.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.106.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.107.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.107.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.107.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.107.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.107.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.107.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.108.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.108.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.108.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.108.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.108.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.108.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.109.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.109.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.109.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.109.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.109.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.109.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.11.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.11.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.11.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.11.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.11.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.11.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.110.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.110.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.110.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.110.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.110.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.110.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.111.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.111.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.111.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.111.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.111.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.111.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.112.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.112.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.112.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.112.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.112.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.112.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.113.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.113.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.113.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.113.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.113.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.113.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.114.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.114.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.114.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.114.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.114.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.114.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.115.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.115.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.115.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.115.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.115.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.115.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.116.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.116.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.116.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.116.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.116.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.116.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.117.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.117.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.117.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.117.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.117.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.117.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.118.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.118.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.118.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.118.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.118.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.118.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.119.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.119.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.119.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.119.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.119.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.119.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.12.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.12.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.12.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.12.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.12.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.12.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.120.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.120.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.120.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.120.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.120.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.120.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.121.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.121.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.121.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.121.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.121.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.121.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.122.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.122.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.122.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.122.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.122.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.122.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.123.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.123.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.123.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.123.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.123.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.123.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.124.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.124.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.124.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.124.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.124.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.124.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.125.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.125.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.125.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.125.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.125.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.125.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.126.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.126.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.126.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.126.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.126.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.126.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.127.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.127.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.127.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.127.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.127.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.127.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.128.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.128.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.128.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.128.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.128.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.128.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.129.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.129.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.129.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.129.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.129.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.129.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.13.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.13.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.13.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.13.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.13.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.13.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.130.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.130.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.130.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.130.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.130.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.130.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.131.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.131.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.131.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.131.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.131.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.131.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.132.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.132.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.132.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.132.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.132.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.132.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.133.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.133.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.133.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.133.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.133.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.133.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.134.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.134.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.134.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.134.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.134.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.134.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.135.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.135.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.135.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.135.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.135.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.135.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.136.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.136.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.136.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.136.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.136.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.136.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.137.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.137.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.137.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.137.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.137.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.137.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.138.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.138.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.138.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.138.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.138.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.138.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.139.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.139.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.139.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.139.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.139.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.139.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.14.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.14.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.14.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.14.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.14.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.14.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.140.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.140.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.140.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.140.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.140.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.140.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.141.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.141.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.141.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.141.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.141.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.141.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.142.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.142.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.142.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.142.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.142.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.142.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.143.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.143.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.143.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.143.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.143.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.143.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.144.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.144.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.144.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.144.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.144.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.144.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.145.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.145.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.145.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.145.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.145.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.145.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.146.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.146.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.146.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.146.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.146.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.146.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.147.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.147.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.147.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.147.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.147.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.147.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.148.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.148.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.148.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.148.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.148.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.148.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.149.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.149.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.149.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.149.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.149.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.149.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.15.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.15.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.15.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.15.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.15.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.15.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.150.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.150.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.150.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.150.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.150.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.150.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.151.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.151.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.151.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.151.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.151.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.151.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.152.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.152.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.152.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.152.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.152.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.152.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.153.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.153.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.153.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.153.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.153.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.153.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.154.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.154.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.154.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.154.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.154.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.154.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.155.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.155.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.155.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.155.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.155.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.155.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.156.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.156.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.156.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.156.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.156.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.156.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.157.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.157.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.157.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.157.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.157.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.157.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.158.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.158.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.158.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.158.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.158.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.158.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.159.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.159.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.159.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.159.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.159.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.159.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.16.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.16.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.16.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.16.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.16.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.16.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.17.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.17.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.17.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.17.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.17.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.17.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.18.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.18.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.18.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.18.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.18.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.18.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.19.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.19.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.19.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.19.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.19.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.19.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.2.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.2.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.2.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.2.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.2.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.2.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.20.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.20.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.20.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.20.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.20.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.20.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.21.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.21.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.21.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.21.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.21.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.21.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.22.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.22.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.22.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.22.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.22.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.22.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.23.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.23.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.23.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.23.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.23.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.23.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.24.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.24.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.24.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.24.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.24.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.24.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.25.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.25.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.25.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.25.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.25.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.25.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.26.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.26.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.26.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.26.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.26.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.26.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.27.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.27.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.27.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.27.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.27.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.27.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.28.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.28.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.28.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.28.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.28.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.28.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.29.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.29.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.29.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.29.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.29.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.29.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.3.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.3.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.3.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.3.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.3.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.3.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.30.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.30.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.30.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.30.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.30.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.30.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.31.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.31.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.31.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.31.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.31.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.31.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.32.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.32.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.32.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.32.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.32.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.32.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.33.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.33.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.33.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.33.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.33.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.33.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.34.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.34.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.34.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.34.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.34.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.34.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.35.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.35.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.35.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.35.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.35.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.35.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.36.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.36.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.36.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.36.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.36.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.36.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.37.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.37.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.37.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.37.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.37.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.37.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.38.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.38.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.38.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.38.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.38.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.38.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.39.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.39.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.39.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.39.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.39.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.39.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.4.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.4.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.4.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.4.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.4.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.4.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.40.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.40.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.40.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.40.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.40.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.40.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.41.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.41.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.41.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.41.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.41.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.41.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.42.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.42.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.42.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.42.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.42.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.42.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.43.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.43.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.43.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.43.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.43.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.43.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.44.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.44.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.44.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.44.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.44.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.44.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.45.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.45.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.45.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.45.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.45.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.45.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.46.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.46.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.46.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.46.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.46.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.46.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.47.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.47.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.47.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.47.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.47.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.47.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.48.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.48.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.48.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.48.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.48.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.48.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.49.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.49.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.49.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.49.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.49.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.49.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.5.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.5.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.5.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.5.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.5.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.5.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.50.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.50.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.50.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.50.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.50.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.50.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.51.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.51.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.51.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.51.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.51.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.51.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.52.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.52.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.52.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.52.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.52.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.52.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.53.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.53.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.53.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.53.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.53.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.53.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.54.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.54.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.54.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.54.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.54.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.54.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.55.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.55.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.55.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.55.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.55.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.55.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.56.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.56.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.56.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.56.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.56.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.56.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.57.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.57.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.57.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.57.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.57.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.57.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.58.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.58.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.58.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.58.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.58.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.58.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.59.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.59.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.59.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.59.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.59.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.59.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.6.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.6.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.6.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.6.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.6.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.6.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.60.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.60.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.60.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.60.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.60.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.60.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.61.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.61.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.61.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.61.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.61.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.61.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.62.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.62.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.62.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.62.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.62.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.62.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.63.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.63.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.63.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.63.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.63.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.63.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.64.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.64.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.64.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.64.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.64.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.64.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.65.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.65.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.65.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.65.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.65.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.65.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.66.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.66.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.66.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.66.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.66.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.66.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.67.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.67.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.67.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.67.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.67.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.67.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.68.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.68.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.68.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.68.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.68.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.68.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.69.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.69.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.69.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.69.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.69.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.69.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.7.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.7.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.7.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.7.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.7.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.7.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.70.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.70.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.70.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.70.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.70.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.70.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.71.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.71.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.71.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.71.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.71.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.71.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.72.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.72.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.72.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.72.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.72.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.72.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.73.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.73.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.73.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.73.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.73.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.73.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.74.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.74.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.74.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.74.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.74.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.74.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.75.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.75.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.75.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.75.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.75.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.75.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.76.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.76.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.76.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.76.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.76.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.76.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.77.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.77.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.77.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.77.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.77.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.77.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.78.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.78.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.78.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.78.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.78.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.78.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.79.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.79.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.79.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.79.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.79.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.79.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.8.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.8.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.8.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.8.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.8.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.8.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.80.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.80.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.80.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.80.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.80.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.80.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.81.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.81.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.81.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.81.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.81.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.81.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.82.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.82.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.82.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.82.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.82.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.82.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.83.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.83.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.83.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.83.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.83.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.83.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.84.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.84.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.84.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.84.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.84.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.84.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.85.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.85.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.85.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.85.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.85.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.85.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.86.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.86.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.86.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.86.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.86.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.86.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.87.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.87.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.87.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.87.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.87.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.87.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.88.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.88.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.88.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.88.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.88.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.88.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.89.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.89.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.89.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.89.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.89.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.89.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.9.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.9.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.9.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.9.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.9.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.9.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.90.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.90.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.90.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.90.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.90.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.90.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.91.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.91.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.91.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.91.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.91.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.91.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.92.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.92.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.92.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.92.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.92.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.92.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.93.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.93.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.93.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.93.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.93.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.93.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.94.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.94.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.94.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.94.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.94.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.94.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.95.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.95.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.95.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.95.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.95.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.95.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.96.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.96.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.96.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.96.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.96.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.96.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.97.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.97.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.97.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.97.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.97.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.97.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.98.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.98.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.98.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.98.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.98.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.98.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.99.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.99.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.99.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.99.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.99.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.experts.99.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.gate.e_score_correction_bias": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.gate.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.shared_experts.down_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.shared_experts.down_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.shared_experts.gate_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.shared_experts.gate_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.shared_experts.up_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.mlp.shared_experts.up_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.post_attention_layernorm.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.self_attn.k_norm.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.self_attn.k_proj.bias": "model-00055-of-00092.safetensors",
+ "model.layers.54.self_attn.k_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.self_attn.k_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.self_attn.o_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.self_attn.o_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.self_attn.q_norm.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.self_attn.q_proj.bias": "model-00055-of-00092.safetensors",
+ "model.layers.54.self_attn.q_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.self_attn.q_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.54.self_attn.v_proj.bias": "model-00055-of-00092.safetensors",
+ "model.layers.54.self_attn.v_proj.weight": "model-00055-of-00092.safetensors",
+ "model.layers.54.self_attn.v_proj.weight_scale": "model-00055-of-00092.safetensors",
+ "model.layers.55.input_layernorm.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.0.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.0.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.0.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.0.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.0.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.0.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.1.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.1.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.1.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.1.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.1.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.1.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.10.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.10.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.10.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.10.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.10.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.10.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.100.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.100.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.100.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.100.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.100.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.100.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.101.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.101.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.101.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.101.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.101.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.101.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.102.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.102.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.102.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.102.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.102.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.102.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.103.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.103.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.103.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.103.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.103.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.103.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.104.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.104.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.104.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.104.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.104.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.104.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.105.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.105.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.105.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.105.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.105.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.105.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.106.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.106.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.106.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.106.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.106.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.106.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.107.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.107.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.107.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.107.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.107.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.107.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.108.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.108.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.108.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.108.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.108.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.108.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.109.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.109.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.109.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.109.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.109.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.109.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.11.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.11.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.11.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.11.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.11.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.11.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.110.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.110.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.110.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.110.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.110.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.110.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.111.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.111.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.111.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.111.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.111.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.111.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.112.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.112.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.112.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.112.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.112.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.112.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.113.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.113.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.113.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.113.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.113.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.113.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.114.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.114.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.114.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.114.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.114.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.114.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.115.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.115.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.115.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.115.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.115.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.115.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.116.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.116.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.116.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.116.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.116.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.116.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.117.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.117.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.117.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.117.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.117.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.117.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.118.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.118.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.118.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.118.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.118.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.118.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.119.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.119.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.119.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.119.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.119.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.119.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.12.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.12.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.12.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.12.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.12.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.12.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.120.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.120.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.120.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.120.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.120.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.120.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.121.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.121.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.121.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.121.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.121.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.121.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.122.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.122.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.122.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.122.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.122.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.122.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.123.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.123.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.123.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.123.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.123.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.123.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.124.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.124.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.124.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.124.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.124.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.124.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.125.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.125.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.125.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.125.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.125.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.125.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.126.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.126.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.126.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.126.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.126.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.126.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.127.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.127.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.127.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.127.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.127.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.127.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.128.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.128.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.128.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.128.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.128.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.128.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.129.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.129.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.129.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.129.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.129.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.129.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.13.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.13.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.13.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.13.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.13.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.13.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.130.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.130.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.130.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.130.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.130.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.130.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.131.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.131.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.131.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.131.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.131.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.131.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.132.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.132.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.132.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.132.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.132.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.132.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.133.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.133.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.133.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.133.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.133.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.133.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.134.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.134.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.134.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.134.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.134.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.134.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.135.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.135.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.135.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.135.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.135.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.135.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.136.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.136.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.136.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.136.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.136.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.136.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.137.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.137.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.137.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.137.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.137.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.137.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.138.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.138.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.138.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.138.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.138.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.138.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.139.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.139.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.139.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.139.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.139.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.139.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.14.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.14.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.14.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.14.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.14.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.14.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.140.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.140.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.140.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.140.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.140.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.140.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.141.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.141.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.141.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.141.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.141.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.141.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.142.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.142.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.142.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.142.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.142.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.142.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.143.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.143.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.143.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.143.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.143.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.143.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.144.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.144.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.144.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.144.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.144.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.144.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.145.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.145.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.145.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.145.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.145.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.145.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.146.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.146.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.146.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.146.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.146.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.146.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.147.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.147.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.147.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.147.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.147.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.147.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.148.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.148.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.148.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.148.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.148.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.148.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.149.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.149.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.149.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.149.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.149.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.149.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.15.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.15.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.15.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.15.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.15.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.15.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.150.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.150.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.150.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.150.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.150.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.150.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.151.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.151.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.151.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.151.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.151.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.151.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.152.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.152.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.152.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.152.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.152.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.152.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.153.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.153.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.153.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.153.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.153.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.153.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.154.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.154.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.154.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.154.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.154.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.154.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.155.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.155.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.155.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.155.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.155.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.155.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.156.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.156.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.156.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.156.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.156.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.156.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.157.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.157.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.157.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.157.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.157.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.157.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.158.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.158.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.158.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.158.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.158.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.158.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.159.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.159.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.159.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.159.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.159.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.159.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.16.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.16.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.16.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.16.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.16.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.16.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.17.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.17.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.17.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.17.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.17.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.17.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.18.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.18.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.18.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.18.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.18.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.18.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.19.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.19.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.19.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.19.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.19.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.19.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.2.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.2.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.2.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.2.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.2.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.2.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.20.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.20.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.20.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.20.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.20.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.20.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.21.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.21.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.21.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.21.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.21.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.21.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.22.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.22.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.22.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.22.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.22.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.22.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.23.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.23.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.23.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.23.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.23.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.23.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.24.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.24.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.24.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.24.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.24.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.24.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.25.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.25.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.25.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.25.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.25.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.25.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.26.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.26.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.26.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.26.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.26.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.26.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.27.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.27.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.27.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.27.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.27.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.27.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.28.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.28.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.28.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.28.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.28.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.28.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.29.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.29.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.29.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.29.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.29.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.29.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.3.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.3.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.3.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.3.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.3.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.3.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.30.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.30.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.30.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.30.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.30.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.30.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.31.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.31.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.31.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.31.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.31.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.31.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.32.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.32.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.32.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.32.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.32.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.32.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.33.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.33.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.33.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.33.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.33.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.33.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.34.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.34.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.34.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.34.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.34.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.34.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.35.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.35.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.35.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.35.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.35.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.35.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.36.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.36.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.36.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.36.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.36.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.36.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.37.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.37.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.37.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.37.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.37.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.37.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.38.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.38.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.38.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.38.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.38.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.38.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.39.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.39.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.39.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.39.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.39.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.39.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.4.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.4.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.4.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.4.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.4.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.4.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.40.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.40.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.40.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.40.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.40.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.40.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.41.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.41.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.41.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.41.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.41.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.41.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.42.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.42.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.42.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.42.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.42.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.42.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.43.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.43.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.43.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.43.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.43.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.43.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.44.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.44.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.44.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.44.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.44.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.44.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.45.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.45.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.45.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.45.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.45.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.45.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.46.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.46.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.46.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.46.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.46.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.46.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.47.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.47.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.47.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.47.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.47.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.47.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.48.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.48.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.48.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.48.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.48.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.48.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.49.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.49.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.49.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.49.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.49.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.49.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.5.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.5.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.5.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.5.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.5.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.5.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.50.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.50.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.50.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.50.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.50.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.50.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.51.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.51.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.51.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.51.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.51.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.51.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.52.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.52.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.52.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.52.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.52.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.52.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.53.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.53.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.53.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.53.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.53.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.53.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.54.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.54.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.54.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.54.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.54.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.54.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.55.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.55.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.55.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.55.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.55.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.55.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.56.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.56.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.56.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.56.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.56.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.56.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.57.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.57.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.57.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.57.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.57.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.57.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.58.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.58.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.58.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.58.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.58.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.58.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.59.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.59.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.59.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.59.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.59.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.59.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.6.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.6.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.6.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.6.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.6.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.6.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.60.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.60.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.60.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.60.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.60.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.60.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.61.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.61.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.61.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.61.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.61.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.61.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.62.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.62.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.62.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.62.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.62.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.62.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.63.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.63.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.63.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.63.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.63.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.63.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.64.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.64.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.64.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.64.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.64.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.64.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.65.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.65.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.65.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.65.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.65.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.65.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.66.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.66.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.66.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.66.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.66.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.66.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.67.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.67.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.67.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.67.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.67.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.67.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.68.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.68.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.68.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.68.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.68.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.68.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.69.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.69.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.69.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.69.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.69.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.69.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.7.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.7.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.7.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.7.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.7.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.7.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.70.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.70.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.70.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.70.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.70.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.70.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.71.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.71.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.71.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.71.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.71.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.71.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.72.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.72.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.72.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.72.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.72.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.72.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.73.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.73.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.73.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.73.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.73.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.73.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.74.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.74.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.74.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.74.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.74.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.74.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.75.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.75.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.75.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.75.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.75.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.75.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.76.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.76.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.76.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.76.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.76.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.76.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.77.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.77.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.77.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.77.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.77.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.77.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.78.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.78.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.78.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.78.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.78.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.78.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.79.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.79.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.79.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.79.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.79.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.79.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.8.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.8.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.8.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.8.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.8.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.8.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.80.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.80.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.80.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.80.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.80.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.80.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.81.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.81.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.81.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.81.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.81.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.81.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.82.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.82.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.82.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.82.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.82.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.82.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.83.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.83.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.83.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.83.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.83.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.83.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.84.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.84.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.84.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.84.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.84.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.84.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.85.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.85.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.85.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.85.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.85.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.85.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.86.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.86.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.86.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.86.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.86.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.86.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.87.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.87.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.87.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.87.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.87.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.87.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.88.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.88.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.88.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.88.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.88.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.88.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.89.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.89.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.89.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.89.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.89.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.89.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.9.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.9.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.9.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.9.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.9.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.9.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.90.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.90.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.90.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.90.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.90.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.90.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.91.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.91.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.91.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.91.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.91.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.91.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.92.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.92.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.92.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.92.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.92.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.92.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.93.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.93.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.93.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.93.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.93.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.93.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.94.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.94.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.94.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.94.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.94.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.94.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.95.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.95.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.95.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.95.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.95.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.95.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.96.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.96.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.96.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.96.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.96.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.96.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.97.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.97.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.97.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.97.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.97.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.97.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.98.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.98.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.98.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.98.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.98.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.98.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.99.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.99.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.99.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.99.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.99.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.experts.99.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.gate.e_score_correction_bias": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.gate.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.shared_experts.down_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.shared_experts.down_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.shared_experts.gate_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.shared_experts.gate_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.shared_experts.up_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.mlp.shared_experts.up_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.post_attention_layernorm.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.self_attn.k_norm.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.self_attn.k_proj.bias": "model-00056-of-00092.safetensors",
+ "model.layers.55.self_attn.k_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.self_attn.k_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.self_attn.o_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.self_attn.o_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.self_attn.q_norm.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.self_attn.q_proj.bias": "model-00056-of-00092.safetensors",
+ "model.layers.55.self_attn.q_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.self_attn.q_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.55.self_attn.v_proj.bias": "model-00056-of-00092.safetensors",
+ "model.layers.55.self_attn.v_proj.weight": "model-00056-of-00092.safetensors",
+ "model.layers.55.self_attn.v_proj.weight_scale": "model-00056-of-00092.safetensors",
+ "model.layers.56.input_layernorm.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.0.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.0.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.0.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.0.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.0.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.0.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.1.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.1.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.1.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.1.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.1.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.1.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.10.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.10.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.10.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.10.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.10.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.10.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.100.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.100.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.100.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.100.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.100.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.100.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.101.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.101.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.101.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.101.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.101.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.101.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.102.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.102.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.102.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.102.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.102.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.102.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.103.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.103.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.103.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.103.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.103.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.103.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.104.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.104.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.104.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.104.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.104.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.104.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.105.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.105.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.105.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.105.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.105.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.105.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.106.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.106.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.106.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.106.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.106.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.106.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.107.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.107.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.107.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.107.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.107.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.107.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.108.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.108.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.108.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.108.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.108.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.108.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.109.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.109.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.109.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.109.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.109.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.109.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.11.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.11.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.11.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.11.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.11.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.11.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.110.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.110.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.110.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.110.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.110.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.110.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.111.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.111.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.111.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.111.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.111.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.111.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.112.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.112.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.112.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.112.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.112.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.112.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.113.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.113.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.113.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.113.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.113.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.113.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.114.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.114.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.114.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.114.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.114.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.114.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.115.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.115.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.115.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.115.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.115.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.115.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.116.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.116.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.116.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.116.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.116.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.116.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.117.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.117.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.117.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.117.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.117.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.117.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.118.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.118.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.118.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.118.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.118.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.118.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.119.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.119.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.119.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.119.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.119.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.119.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.12.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.12.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.12.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.12.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.12.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.12.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.120.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.120.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.120.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.120.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.120.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.120.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.121.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.121.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.121.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.121.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.121.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.121.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.122.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.122.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.122.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.122.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.122.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.122.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.123.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.123.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.123.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.123.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.123.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.123.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.124.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.124.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.124.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.124.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.124.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.124.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.125.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.125.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.125.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.125.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.125.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.125.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.126.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.126.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.126.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.126.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.126.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.126.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.127.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.127.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.127.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.127.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.127.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.127.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.128.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.128.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.128.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.128.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.128.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.128.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.129.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.129.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.129.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.129.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.129.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.129.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.13.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.13.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.13.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.13.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.13.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.13.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.130.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.130.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.130.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.130.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.130.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.130.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.131.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.131.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.131.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.131.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.131.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.131.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.132.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.132.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.132.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.132.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.132.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.132.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.133.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.133.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.133.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.133.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.133.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.133.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.134.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.134.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.134.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.134.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.134.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.134.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.135.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.135.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.135.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.135.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.135.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.135.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.136.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.136.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.136.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.136.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.136.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.136.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.137.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.137.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.137.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.137.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.137.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.137.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.138.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.138.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.138.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.138.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.138.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.138.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.139.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.139.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.139.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.139.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.139.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.139.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.14.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.14.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.14.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.14.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.14.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.14.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.140.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.140.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.140.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.140.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.140.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.140.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.141.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.141.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.141.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.141.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.141.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.141.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.142.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.142.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.142.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.142.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.142.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.142.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.143.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.143.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.143.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.143.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.143.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.143.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.144.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.144.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.144.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.144.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.144.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.144.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.145.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.145.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.145.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.145.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.145.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.145.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.146.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.146.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.146.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.146.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.146.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.146.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.147.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.147.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.147.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.147.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.147.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.147.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.148.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.148.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.148.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.148.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.148.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.148.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.149.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.149.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.149.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.149.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.149.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.149.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.15.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.15.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.15.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.15.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.15.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.15.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.150.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.150.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.150.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.150.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.150.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.150.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.151.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.151.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.151.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.151.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.151.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.151.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.152.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.152.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.152.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.152.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.152.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.152.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.153.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.153.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.153.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.153.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.153.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.153.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.154.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.154.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.154.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.154.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.154.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.154.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.155.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.155.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.155.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.155.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.155.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.155.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.156.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.156.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.156.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.156.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.156.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.156.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.157.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.157.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.157.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.157.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.157.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.157.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.158.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.158.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.158.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.158.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.158.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.158.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.159.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.159.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.159.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.159.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.159.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.159.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.16.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.16.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.16.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.16.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.16.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.16.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.17.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.17.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.17.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.17.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.17.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.17.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.18.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.18.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.18.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.18.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.18.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.18.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.19.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.19.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.19.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.19.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.19.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.19.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.2.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.2.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.2.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.2.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.2.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.2.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.20.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.20.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.20.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.20.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.20.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.20.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.21.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.21.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.21.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.21.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.21.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.21.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.22.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.22.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.22.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.22.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.22.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.22.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.23.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.23.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.23.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.23.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.23.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.23.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.24.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.24.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.24.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.24.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.24.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.24.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.25.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.25.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.25.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.25.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.25.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.25.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.26.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.26.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.26.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.26.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.26.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.26.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.27.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.27.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.27.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.27.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.27.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.27.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.28.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.28.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.28.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.28.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.28.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.28.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.29.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.29.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.29.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.29.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.29.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.29.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.3.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.3.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.3.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.3.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.3.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.3.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.30.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.30.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.30.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.30.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.30.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.30.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.31.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.31.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.31.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.31.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.31.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.31.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.32.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.32.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.32.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.32.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.32.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.32.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.33.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.33.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.33.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.33.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.33.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.33.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.34.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.34.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.34.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.34.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.34.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.34.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.35.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.35.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.35.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.35.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.35.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.35.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.36.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.36.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.36.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.36.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.36.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.36.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.37.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.37.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.37.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.37.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.37.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.37.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.38.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.38.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.38.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.38.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.38.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.38.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.39.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.39.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.39.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.39.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.39.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.39.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.4.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.4.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.4.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.4.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.4.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.4.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.40.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.40.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.40.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.40.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.40.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.40.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.41.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.41.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.41.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.41.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.41.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.41.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.42.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.42.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.42.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.42.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.42.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.42.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.43.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.43.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.43.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.43.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.43.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.43.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.44.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.44.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.44.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.44.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.44.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.44.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.45.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.45.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.45.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.45.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.45.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.45.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.46.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.46.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.46.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.46.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.46.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.46.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.47.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.47.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.47.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.47.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.47.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.47.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.48.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.48.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.48.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.48.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.48.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.48.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.49.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.49.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.49.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.49.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.49.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.49.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.5.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.5.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.5.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.5.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.5.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.5.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.50.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.50.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.50.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.50.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.50.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.50.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.51.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.51.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.51.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.51.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.51.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.51.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.52.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.52.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.52.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.52.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.52.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.52.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.53.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.53.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.53.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.53.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.53.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.53.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.54.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.54.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.54.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.54.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.54.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.54.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.55.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.55.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.55.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.55.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.55.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.55.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.56.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.56.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.56.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.56.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.56.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.56.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.57.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.57.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.57.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.57.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.57.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.57.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.58.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.58.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.58.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.58.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.58.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.58.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.59.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.59.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.59.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.59.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.59.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.59.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.6.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.6.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.6.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.6.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.6.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.6.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.60.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.60.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.60.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.60.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.60.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.60.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.61.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.61.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.61.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.61.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.61.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.61.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.62.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.62.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.62.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.62.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.62.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.62.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.63.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.63.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.63.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.63.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.63.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.63.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.64.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.64.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.64.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.64.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.64.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.64.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.65.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.65.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.65.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.65.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.65.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.65.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.66.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.66.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.66.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.66.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.66.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.66.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.67.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.67.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.67.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.67.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.67.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.67.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.68.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.68.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.68.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.68.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.68.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.68.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.69.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.69.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.69.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.69.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.69.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.69.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.7.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.7.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.7.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.7.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.7.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.7.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.70.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.70.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.70.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.70.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.70.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.70.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.71.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.71.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.71.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.71.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.71.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.71.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.72.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.72.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.72.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.72.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.72.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.72.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.73.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.73.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.73.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.73.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.73.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.73.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.74.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.74.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.74.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.74.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.74.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.74.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.75.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.75.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.75.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.75.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.75.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.75.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.76.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.76.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.76.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.76.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.76.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.76.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.77.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.77.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.77.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.77.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.77.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.77.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.78.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.78.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.78.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.78.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.78.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.78.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.79.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.79.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.79.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.79.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.79.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.79.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.8.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.8.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.8.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.8.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.8.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.8.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.80.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.80.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.80.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.80.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.80.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.80.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.81.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.81.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.81.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.81.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.81.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.81.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.82.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.82.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.82.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.82.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.82.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.82.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.83.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.83.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.83.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.83.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.83.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.83.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.84.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.84.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.84.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.84.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.84.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.84.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.85.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.85.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.85.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.85.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.85.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.85.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.86.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.86.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.86.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.86.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.86.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.86.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.87.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.87.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.87.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.87.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.87.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.87.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.88.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.88.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.88.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.88.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.88.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.88.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.89.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.89.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.89.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.89.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.89.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.89.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.9.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.9.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.9.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.9.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.9.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.9.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.90.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.90.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.90.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.90.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.90.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.90.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.91.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.91.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.91.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.91.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.91.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.91.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.92.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.92.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.92.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.92.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.92.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.92.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.93.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.93.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.93.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.93.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.93.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.93.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.94.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.94.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.94.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.94.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.94.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.94.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.95.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.95.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.95.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.95.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.95.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.95.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.96.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.96.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.96.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.96.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.96.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.96.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.97.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.97.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.97.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.97.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.97.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.97.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.98.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.98.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.98.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.98.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.98.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.98.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.99.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.99.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.99.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.99.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.99.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.experts.99.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.gate.e_score_correction_bias": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.gate.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.shared_experts.down_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.shared_experts.down_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.shared_experts.gate_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.shared_experts.gate_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.shared_experts.up_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.mlp.shared_experts.up_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.post_attention_layernorm.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.self_attn.k_norm.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.self_attn.k_proj.bias": "model-00057-of-00092.safetensors",
+ "model.layers.56.self_attn.k_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.self_attn.k_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.self_attn.o_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.self_attn.o_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.self_attn.q_norm.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.self_attn.q_proj.bias": "model-00057-of-00092.safetensors",
+ "model.layers.56.self_attn.q_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.self_attn.q_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.56.self_attn.v_proj.bias": "model-00057-of-00092.safetensors",
+ "model.layers.56.self_attn.v_proj.weight": "model-00057-of-00092.safetensors",
+ "model.layers.56.self_attn.v_proj.weight_scale": "model-00057-of-00092.safetensors",
+ "model.layers.57.input_layernorm.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.0.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.0.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.0.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.0.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.0.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.0.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.1.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.1.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.1.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.1.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.1.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.1.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.10.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.10.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.10.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.10.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.10.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.10.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.100.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.100.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.100.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.100.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.100.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.100.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.101.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.101.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.101.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.101.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.101.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.101.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.102.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.102.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.102.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.102.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.102.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.102.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.103.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.103.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.103.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.103.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.103.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.103.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.104.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.104.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.104.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.104.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.104.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.104.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.105.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.105.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.105.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.105.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.105.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.105.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.106.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.106.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.106.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.106.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.106.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.106.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.107.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.107.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.107.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.107.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.107.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.107.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.108.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.108.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.108.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.108.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.108.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.108.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.109.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.109.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.109.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.109.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.109.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.109.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.11.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.11.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.11.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.11.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.11.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.11.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.110.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.110.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.110.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.110.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.110.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.110.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.111.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.111.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.111.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.111.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.111.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.111.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.112.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.112.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.112.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.112.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.112.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.112.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.113.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.113.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.113.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.113.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.113.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.113.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.114.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.114.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.114.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.114.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.114.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.114.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.115.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.115.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.115.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.115.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.115.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.115.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.116.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.116.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.116.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.116.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.116.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.116.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.117.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.117.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.117.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.117.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.117.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.117.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.118.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.118.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.118.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.118.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.118.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.118.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.119.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.119.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.119.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.119.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.119.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.119.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.12.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.12.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.12.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.12.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.12.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.12.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.120.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.120.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.120.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.120.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.120.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.120.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.121.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.121.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.121.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.121.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.121.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.121.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.122.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.122.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.122.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.122.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.122.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.122.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.123.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.123.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.123.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.123.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.123.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.123.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.124.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.124.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.124.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.124.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.124.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.124.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.125.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.125.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.125.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.125.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.125.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.125.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.126.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.126.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.126.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.126.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.126.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.126.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.127.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.127.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.127.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.127.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.127.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.127.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.128.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.128.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.128.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.128.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.128.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.128.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.129.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.129.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.129.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.129.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.129.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.129.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.13.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.13.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.13.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.13.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.13.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.13.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.130.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.130.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.130.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.130.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.130.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.130.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.131.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.131.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.131.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.131.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.131.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.131.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.132.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.132.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.132.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.132.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.132.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.132.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.133.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.133.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.133.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.133.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.133.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.133.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.134.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.134.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.134.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.134.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.134.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.134.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.135.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.135.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.135.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.135.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.135.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.135.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.136.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.136.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.136.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.136.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.136.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.136.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.137.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.137.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.137.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.137.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.137.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.137.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.138.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.138.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.138.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.138.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.138.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.138.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.139.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.139.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.139.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.139.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.139.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.139.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.14.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.14.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.14.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.14.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.14.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.14.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.140.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.140.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.140.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.140.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.140.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.140.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.141.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.141.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.141.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.141.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.141.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.141.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.142.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.142.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.142.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.142.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.142.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.142.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.143.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.143.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.143.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.143.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.143.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.143.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.144.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.144.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.144.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.144.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.144.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.144.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.145.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.145.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.145.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.145.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.145.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.145.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.146.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.146.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.146.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.146.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.146.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.146.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.147.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.147.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.147.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.147.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.147.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.147.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.148.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.148.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.148.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.148.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.148.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.148.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.149.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.149.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.149.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.149.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.149.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.149.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.15.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.15.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.15.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.15.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.15.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.15.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.150.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.150.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.150.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.150.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.150.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.150.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.151.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.151.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.151.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.151.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.151.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.151.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.152.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.152.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.152.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.152.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.152.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.152.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.153.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.153.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.153.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.153.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.153.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.153.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.154.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.154.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.154.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.154.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.154.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.154.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.155.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.155.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.155.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.155.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.155.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.155.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.156.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.156.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.156.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.156.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.156.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.156.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.157.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.157.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.157.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.157.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.157.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.157.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.158.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.158.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.158.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.158.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.158.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.158.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.159.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.159.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.159.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.159.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.159.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.159.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.16.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.16.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.16.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.16.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.16.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.16.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.17.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.17.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.17.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.17.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.17.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.17.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.18.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.18.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.18.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.18.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.18.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.18.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.19.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.19.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.19.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.19.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.19.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.19.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.2.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.2.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.2.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.2.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.2.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.2.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.20.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.20.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.20.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.20.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.20.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.20.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.21.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.21.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.21.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.21.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.21.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.21.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.22.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.22.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.22.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.22.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.22.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.22.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.23.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.23.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.23.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.23.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.23.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.23.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.24.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.24.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.24.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.24.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.24.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.24.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.25.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.25.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.25.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.25.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.25.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.25.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.26.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.26.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.26.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.26.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.26.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.26.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.27.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.27.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.27.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.27.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.27.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.27.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.28.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.28.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.28.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.28.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.28.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.28.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.29.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.29.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.29.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.29.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.29.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.29.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.3.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.3.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.3.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.3.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.3.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.3.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.30.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.30.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.30.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.30.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.30.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.30.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.31.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.31.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.31.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.31.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.31.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.31.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.32.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.32.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.32.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.32.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.32.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.32.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.33.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.33.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.33.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.33.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.33.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.33.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.34.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.34.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.34.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.34.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.34.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.34.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.35.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.35.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.35.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.35.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.35.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.35.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.36.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.36.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.36.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.36.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.36.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.36.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.37.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.37.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.37.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.37.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.37.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.37.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.38.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.38.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.38.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.38.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.38.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.38.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.39.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.39.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.39.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.39.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.39.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.39.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.4.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.4.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.4.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.4.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.4.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.4.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.40.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.40.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.40.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.40.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.40.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.40.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.41.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.41.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.41.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.41.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.41.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.41.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.42.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.42.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.42.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.42.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.42.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.42.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.43.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.43.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.43.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.43.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.43.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.43.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.44.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.44.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.44.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.44.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.44.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.44.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.45.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.45.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.45.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.45.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.45.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.45.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.46.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.46.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.46.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.46.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.46.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.46.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.47.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.47.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.47.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.47.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.47.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.47.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.48.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.48.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.48.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.48.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.48.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.48.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.49.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.49.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.49.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.49.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.49.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.49.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.5.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.5.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.5.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.5.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.5.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.5.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.50.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.50.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.50.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.50.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.50.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.50.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.51.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.51.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.51.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.51.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.51.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.51.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.52.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.52.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.52.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.52.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.52.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.52.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.53.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.53.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.53.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.53.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.53.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.53.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.54.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.54.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.54.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.54.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.54.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.54.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.55.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.55.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.55.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.55.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.55.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.55.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.56.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.56.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.56.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.56.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.56.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.56.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.57.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.57.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.57.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.57.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.57.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.57.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.58.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.58.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.58.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.58.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.58.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.58.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.59.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.59.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.59.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.59.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.59.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.59.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.6.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.6.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.6.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.6.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.6.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.6.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.60.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.60.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.60.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.60.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.60.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.60.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.61.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.61.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.61.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.61.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.61.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.61.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.62.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.62.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.62.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.62.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.62.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.62.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.63.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.63.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.63.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.63.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.63.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.63.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.64.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.64.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.64.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.64.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.64.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.64.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.65.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.65.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.65.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.65.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.65.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.65.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.66.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.66.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.66.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.66.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.66.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.66.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.67.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.67.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.67.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.67.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.67.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.67.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.68.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.68.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.68.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.68.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.68.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.68.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.69.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.69.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.69.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.69.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.69.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.69.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.7.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.7.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.7.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.7.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.7.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.7.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.70.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.70.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.70.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.70.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.70.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.70.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.71.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.71.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.71.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.71.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.71.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.71.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.72.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.72.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.72.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.72.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.72.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.72.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.73.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.73.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.73.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.73.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.73.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.73.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.74.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.74.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.74.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.74.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.74.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.74.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.75.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.75.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.75.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.75.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.75.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.75.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.76.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.76.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.76.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.76.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.76.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.76.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.77.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.77.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.77.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.77.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.77.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.77.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.78.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.78.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.78.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.78.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.78.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.78.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.79.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.79.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.79.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.79.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.79.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.79.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.8.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.8.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.8.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.8.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.8.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.8.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.80.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.80.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.80.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.80.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.80.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.80.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.81.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.81.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.81.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.81.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.81.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.81.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.82.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.82.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.82.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.82.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.82.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.82.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.83.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.83.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.83.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.83.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.83.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.83.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.84.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.84.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.84.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.84.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.84.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.84.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.85.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.85.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.85.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.85.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.85.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.85.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.86.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.86.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.86.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.86.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.86.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.86.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.87.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.87.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.87.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.87.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.87.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.87.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.88.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.88.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.88.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.88.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.88.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.88.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.89.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.89.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.89.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.89.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.89.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.89.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.9.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.9.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.9.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.9.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.9.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.9.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.90.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.90.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.90.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.90.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.90.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.90.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.91.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.91.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.91.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.91.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.91.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.91.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.92.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.92.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.92.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.92.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.92.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.92.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.93.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.93.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.93.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.93.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.93.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.93.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.94.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.94.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.94.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.94.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.94.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.94.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.95.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.95.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.95.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.95.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.95.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.95.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.96.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.96.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.96.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.96.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.96.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.96.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.97.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.97.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.97.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.97.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.97.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.97.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.98.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.98.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.98.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.98.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.98.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.98.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.99.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.99.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.99.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.99.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.99.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.experts.99.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.gate.e_score_correction_bias": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.gate.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.shared_experts.down_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.shared_experts.down_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.shared_experts.gate_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.shared_experts.gate_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.shared_experts.up_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.mlp.shared_experts.up_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.post_attention_layernorm.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.self_attn.k_norm.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.self_attn.k_proj.bias": "model-00058-of-00092.safetensors",
+ "model.layers.57.self_attn.k_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.self_attn.k_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.self_attn.o_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.self_attn.o_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.self_attn.q_norm.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.self_attn.q_proj.bias": "model-00058-of-00092.safetensors",
+ "model.layers.57.self_attn.q_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.self_attn.q_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.57.self_attn.v_proj.bias": "model-00058-of-00092.safetensors",
+ "model.layers.57.self_attn.v_proj.weight": "model-00058-of-00092.safetensors",
+ "model.layers.57.self_attn.v_proj.weight_scale": "model-00058-of-00092.safetensors",
+ "model.layers.58.input_layernorm.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.0.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.0.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.0.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.0.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.0.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.0.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.1.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.1.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.1.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.1.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.1.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.1.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.10.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.10.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.10.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.10.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.10.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.10.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.100.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.100.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.100.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.100.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.100.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.100.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.101.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.101.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.101.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.101.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.101.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.101.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.102.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.102.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.102.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.102.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.102.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.102.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.103.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.103.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.103.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.103.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.103.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.103.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.104.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.104.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.104.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.104.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.104.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.104.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.105.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.105.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.105.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.105.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.105.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.105.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.106.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.106.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.106.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.106.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.106.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.106.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.107.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.107.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.107.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.107.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.107.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.107.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.108.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.108.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.108.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.108.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.108.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.108.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.109.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.109.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.109.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.109.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.109.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.109.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.11.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.11.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.11.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.11.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.11.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.11.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.110.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.110.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.110.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.110.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.110.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.110.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.111.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.111.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.111.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.111.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.111.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.111.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.112.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.112.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.112.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.112.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.112.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.112.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.113.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.113.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.113.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.113.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.113.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.113.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.114.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.114.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.114.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.114.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.114.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.114.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.115.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.115.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.115.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.115.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.115.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.115.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.116.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.116.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.116.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.116.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.116.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.116.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.117.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.117.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.117.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.117.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.117.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.117.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.118.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.118.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.118.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.118.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.118.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.118.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.119.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.119.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.119.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.119.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.119.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.119.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.12.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.12.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.12.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.12.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.12.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.12.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.120.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.120.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.120.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.120.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.120.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.120.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.121.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.121.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.121.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.121.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.121.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.121.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.122.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.122.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.122.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.122.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.122.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.122.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.123.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.123.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.123.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.123.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.123.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.123.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.124.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.124.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.124.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.124.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.124.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.124.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.125.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.125.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.125.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.125.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.125.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.125.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.126.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.126.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.126.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.126.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.126.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.126.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.127.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.127.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.127.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.127.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.127.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.127.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.128.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.128.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.128.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.128.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.128.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.128.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.129.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.129.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.129.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.129.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.129.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.129.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.13.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.13.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.13.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.13.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.13.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.13.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.130.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.130.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.130.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.130.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.130.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.130.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.131.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.131.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.131.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.131.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.131.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.131.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.132.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.132.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.132.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.132.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.132.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.132.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.133.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.133.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.133.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.133.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.133.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.133.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.134.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.134.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.134.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.134.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.134.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.134.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.135.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.135.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.135.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.135.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.135.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.135.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.136.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.136.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.136.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.136.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.136.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.136.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.137.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.137.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.137.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.137.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.137.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.137.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.138.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.138.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.138.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.138.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.138.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.138.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.139.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.139.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.139.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.139.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.139.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.139.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.14.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.14.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.14.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.14.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.14.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.14.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.140.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.140.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.140.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.140.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.140.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.140.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.141.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.141.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.141.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.141.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.141.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.141.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.142.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.142.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.142.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.142.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.142.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.142.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.143.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.143.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.143.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.143.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.143.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.143.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.144.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.144.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.144.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.144.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.144.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.144.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.145.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.145.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.145.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.145.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.145.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.145.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.146.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.146.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.146.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.146.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.146.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.146.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.147.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.147.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.147.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.147.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.147.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.147.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.148.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.148.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.148.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.148.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.148.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.148.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.149.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.149.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.149.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.149.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.149.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.149.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.15.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.15.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.15.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.15.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.15.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.15.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.150.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.150.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.150.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.150.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.150.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.150.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.151.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.151.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.151.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.151.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.151.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.151.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.152.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.152.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.152.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.152.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.152.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.152.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.153.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.153.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.153.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.153.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.153.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.153.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.154.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.154.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.154.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.154.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.154.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.154.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.155.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.155.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.155.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.155.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.155.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.155.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.156.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.156.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.156.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.156.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.156.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.156.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.157.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.157.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.157.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.157.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.157.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.157.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.158.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.158.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.158.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.158.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.158.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.158.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.159.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.159.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.159.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.159.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.159.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.159.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.16.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.16.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.16.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.16.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.16.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.16.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.17.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.17.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.17.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.17.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.17.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.17.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.18.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.18.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.18.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.18.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.18.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.18.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.19.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.19.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.19.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.19.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.19.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.19.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.2.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.2.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.2.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.2.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.2.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.2.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.20.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.20.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.20.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.20.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.20.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.20.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.21.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.21.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.21.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.21.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.21.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.21.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.22.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.22.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.22.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.22.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.22.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.22.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.23.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.23.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.23.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.23.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.23.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.23.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.24.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.24.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.24.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.24.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.24.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.24.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.25.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.25.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.25.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.25.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.25.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.25.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.26.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.26.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.26.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.26.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.26.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.26.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.27.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.27.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.27.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.27.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.27.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.27.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.28.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.28.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.28.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.28.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.28.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.28.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.29.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.29.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.29.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.29.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.29.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.29.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.3.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.3.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.3.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.3.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.3.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.3.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.30.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.30.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.30.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.30.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.30.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.30.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.31.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.31.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.31.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.31.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.31.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.31.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.32.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.32.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.32.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.32.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.32.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.32.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.33.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.33.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.33.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.33.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.33.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.33.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.34.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.34.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.34.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.34.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.34.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.34.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.35.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.35.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.35.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.35.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.35.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.35.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.36.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.36.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.36.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.36.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.36.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.36.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.37.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.37.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.37.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.37.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.37.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.37.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.38.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.38.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.38.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.38.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.38.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.38.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.39.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.39.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.39.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.39.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.39.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.39.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.4.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.4.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.4.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.4.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.4.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.4.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.40.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.40.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.40.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.40.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.40.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.40.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.41.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.41.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.41.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.41.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.41.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.41.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.42.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.42.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.42.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.42.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.42.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.42.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.43.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.43.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.43.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.43.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.43.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.43.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.44.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.44.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.44.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.44.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.44.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.44.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.45.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.45.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.45.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.45.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.45.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.45.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.46.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.46.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.46.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.46.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.46.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.46.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.47.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.47.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.47.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.47.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.47.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.47.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.48.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.48.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.48.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.48.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.48.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.48.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.49.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.49.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.49.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.49.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.49.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.49.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.5.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.5.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.5.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.5.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.5.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.5.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.50.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.50.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.50.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.50.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.50.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.50.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.51.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.51.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.51.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.51.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.51.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.51.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.52.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.52.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.52.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.52.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.52.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.52.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.53.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.53.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.53.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.53.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.53.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.53.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.54.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.54.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.54.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.54.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.54.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.54.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.55.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.55.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.55.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.55.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.55.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.55.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.56.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.56.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.56.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.56.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.56.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.56.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.57.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.57.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.57.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.57.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.57.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.57.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.58.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.58.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.58.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.58.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.58.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.58.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.59.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.59.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.59.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.59.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.59.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.59.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.6.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.6.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.6.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.6.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.6.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.6.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.60.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.60.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.60.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.60.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.60.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.60.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.61.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.61.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.61.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.61.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.61.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.61.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.62.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.62.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.62.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.62.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.62.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.62.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.63.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.63.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.63.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.63.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.63.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.63.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.64.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.64.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.64.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.64.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.64.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.64.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.65.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.65.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.65.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.65.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.65.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.65.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.66.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.66.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.66.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.66.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.66.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.66.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.67.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.67.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.67.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.67.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.67.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.67.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.68.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.68.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.68.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.68.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.68.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.68.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.69.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.69.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.69.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.69.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.69.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.69.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.7.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.7.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.7.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.7.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.7.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.7.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.70.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.70.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.70.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.70.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.70.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.70.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.71.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.71.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.71.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.71.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.71.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.71.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.72.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.72.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.72.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.72.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.72.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.72.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.73.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.73.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.73.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.73.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.73.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.73.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.74.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.74.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.74.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.74.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.74.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.74.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.75.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.75.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.75.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.75.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.75.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.75.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.76.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.76.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.76.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.76.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.76.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.76.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.77.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.77.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.77.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.77.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.77.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.77.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.78.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.78.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.78.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.78.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.78.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.78.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.79.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.79.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.79.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.79.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.79.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.79.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.8.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.8.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.8.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.8.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.8.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.8.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.80.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.80.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.80.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.80.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.80.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.80.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.81.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.81.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.81.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.81.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.81.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.81.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.82.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.82.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.82.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.82.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.82.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.82.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.83.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.83.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.83.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.83.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.83.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.83.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.84.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.84.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.84.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.84.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.84.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.84.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.85.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.85.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.85.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.85.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.85.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.85.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.86.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.86.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.86.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.86.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.86.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.86.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.87.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.87.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.87.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.87.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.87.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.87.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.88.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.88.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.88.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.88.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.88.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.88.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.89.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.89.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.89.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.89.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.89.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.89.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.9.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.9.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.9.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.9.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.9.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.9.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.90.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.90.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.90.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.90.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.90.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.90.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.91.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.91.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.91.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.91.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.91.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.91.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.92.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.92.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.92.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.92.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.92.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.92.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.93.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.93.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.93.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.93.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.93.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.93.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.94.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.94.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.94.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.94.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.94.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.94.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.95.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.95.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.95.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.95.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.95.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.95.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.96.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.96.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.96.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.96.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.96.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.96.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.97.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.97.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.97.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.97.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.97.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.97.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.98.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.98.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.98.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.98.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.98.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.98.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.99.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.99.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.99.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.99.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.99.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.experts.99.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.gate.e_score_correction_bias": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.gate.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.shared_experts.down_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.shared_experts.down_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.shared_experts.gate_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.shared_experts.gate_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.shared_experts.up_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.mlp.shared_experts.up_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.post_attention_layernorm.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.self_attn.k_norm.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.self_attn.k_proj.bias": "model-00059-of-00092.safetensors",
+ "model.layers.58.self_attn.k_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.self_attn.k_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.self_attn.o_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.self_attn.o_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.self_attn.q_norm.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.self_attn.q_proj.bias": "model-00059-of-00092.safetensors",
+ "model.layers.58.self_attn.q_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.self_attn.q_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.58.self_attn.v_proj.bias": "model-00059-of-00092.safetensors",
+ "model.layers.58.self_attn.v_proj.weight": "model-00059-of-00092.safetensors",
+ "model.layers.58.self_attn.v_proj.weight_scale": "model-00059-of-00092.safetensors",
+ "model.layers.59.input_layernorm.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.0.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.0.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.0.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.0.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.0.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.0.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.1.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.1.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.1.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.1.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.1.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.1.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.10.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.10.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.10.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.10.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.10.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.10.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.100.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.100.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.100.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.100.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.100.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.100.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.101.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.101.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.101.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.101.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.101.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.101.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.102.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.102.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.102.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.102.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.102.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.102.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.103.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.103.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.103.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.103.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.103.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.103.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.104.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.104.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.104.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.104.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.104.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.104.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.105.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.105.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.105.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.105.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.105.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.105.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.106.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.106.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.106.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.106.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.106.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.106.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.107.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.107.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.107.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.107.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.107.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.107.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.108.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.108.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.108.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.108.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.108.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.108.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.109.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.109.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.109.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.109.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.109.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.109.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.11.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.11.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.11.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.11.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.11.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.11.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.110.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.110.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.110.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.110.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.110.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.110.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.111.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.111.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.111.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.111.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.111.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.111.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.112.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.112.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.112.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.112.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.112.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.112.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.113.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.113.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.113.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.113.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.113.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.113.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.114.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.114.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.114.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.114.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.114.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.114.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.115.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.115.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.115.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.115.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.115.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.115.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.116.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.116.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.116.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.116.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.116.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.116.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.117.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.117.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.117.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.117.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.117.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.117.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.118.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.118.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.118.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.118.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.118.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.118.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.119.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.119.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.119.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.119.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.119.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.119.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.12.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.12.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.12.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.12.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.12.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.12.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.120.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.120.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.120.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.120.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.120.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.120.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.121.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.121.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.121.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.121.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.121.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.121.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.122.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.122.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.122.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.122.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.122.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.122.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.123.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.123.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.123.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.123.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.123.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.123.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.124.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.124.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.124.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.124.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.124.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.124.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.125.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.125.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.125.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.125.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.125.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.125.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.126.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.126.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.126.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.126.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.126.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.126.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.127.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.127.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.127.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.127.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.127.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.127.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.128.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.128.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.128.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.128.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.128.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.128.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.129.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.129.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.129.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.129.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.129.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.129.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.13.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.13.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.13.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.13.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.13.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.13.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.130.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.130.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.130.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.130.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.130.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.130.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.131.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.131.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.131.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.131.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.131.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.131.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.132.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.132.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.132.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.132.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.132.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.132.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.133.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.133.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.133.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.133.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.133.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.133.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.134.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.134.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.134.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.134.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.134.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.134.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.135.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.135.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.135.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.135.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.135.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.135.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.136.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.136.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.136.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.136.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.136.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.136.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.137.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.137.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.137.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.137.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.137.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.137.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.138.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.138.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.138.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.138.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.138.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.138.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.139.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.139.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.139.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.139.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.139.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.139.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.14.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.14.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.14.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.14.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.14.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.14.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.140.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.140.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.140.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.140.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.140.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.140.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.141.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.141.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.141.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.141.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.141.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.141.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.142.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.142.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.142.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.142.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.142.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.142.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.143.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.143.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.143.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.143.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.143.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.143.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.144.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.144.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.144.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.144.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.144.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.144.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.145.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.145.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.145.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.145.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.145.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.145.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.146.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.146.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.146.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.146.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.146.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.146.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.147.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.147.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.147.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.147.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.147.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.147.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.148.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.148.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.148.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.148.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.148.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.148.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.149.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.149.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.149.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.149.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.149.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.149.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.15.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.15.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.15.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.15.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.15.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.15.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.150.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.150.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.150.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.150.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.150.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.150.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.151.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.151.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.151.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.151.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.151.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.151.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.152.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.152.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.152.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.152.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.152.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.152.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.153.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.153.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.153.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.153.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.153.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.153.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.154.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.154.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.154.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.154.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.154.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.154.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.155.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.155.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.155.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.155.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.155.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.155.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.156.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.156.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.156.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.156.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.156.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.156.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.157.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.157.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.157.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.157.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.157.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.157.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.158.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.158.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.158.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.158.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.158.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.158.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.159.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.159.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.159.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.159.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.159.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.159.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.16.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.16.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.16.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.16.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.16.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.16.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.17.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.17.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.17.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.17.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.17.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.17.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.18.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.18.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.18.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.18.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.18.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.18.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.19.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.19.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.19.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.19.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.19.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.19.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.2.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.2.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.2.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.2.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.2.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.2.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.20.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.20.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.20.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.20.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.20.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.20.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.21.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.21.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.21.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.21.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.21.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.21.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.22.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.22.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.22.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.22.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.22.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.22.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.23.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.23.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.23.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.23.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.23.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.23.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.24.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.24.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.24.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.24.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.24.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.24.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.25.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.25.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.25.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.25.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.25.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.25.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.26.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.26.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.26.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.26.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.26.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.26.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.27.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.27.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.27.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.27.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.27.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.27.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.28.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.28.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.28.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.28.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.28.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.28.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.29.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.29.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.29.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.29.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.29.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.29.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.3.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.3.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.3.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.3.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.3.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.3.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.30.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.30.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.30.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.30.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.30.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.30.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.31.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.31.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.31.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.31.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.31.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.31.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.32.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.32.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.32.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.32.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.32.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.32.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.33.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.33.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.33.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.33.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.33.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.33.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.34.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.34.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.34.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.34.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.34.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.34.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.35.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.35.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.35.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.35.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.35.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.35.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.36.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.36.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.36.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.36.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.36.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.36.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.37.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.37.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.37.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.37.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.37.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.37.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.38.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.38.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.38.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.38.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.38.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.38.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.39.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.39.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.39.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.39.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.39.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.39.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.4.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.4.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.4.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.4.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.4.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.4.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.40.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.40.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.40.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.40.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.40.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.40.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.41.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.41.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.41.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.41.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.41.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.41.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.42.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.42.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.42.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.42.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.42.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.42.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.43.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.43.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.43.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.43.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.43.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.43.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.44.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.44.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.44.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.44.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.44.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.44.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.45.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.45.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.45.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.45.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.45.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.45.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.46.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.46.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.46.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.46.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.46.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.46.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.47.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.47.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.47.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.47.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.47.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.47.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.48.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.48.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.48.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.48.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.48.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.48.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.49.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.49.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.49.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.49.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.49.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.49.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.5.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.5.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.5.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.5.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.5.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.5.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.50.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.50.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.50.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.50.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.50.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.50.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.51.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.51.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.51.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.51.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.51.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.51.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.52.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.52.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.52.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.52.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.52.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.52.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.53.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.53.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.53.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.53.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.53.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.53.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.54.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.54.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.54.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.54.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.54.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.54.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.55.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.55.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.55.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.55.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.55.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.55.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.56.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.56.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.56.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.56.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.56.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.56.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.57.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.57.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.57.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.57.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.57.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.57.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.58.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.58.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.58.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.58.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.58.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.58.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.59.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.59.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.59.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.59.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.59.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.59.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.6.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.6.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.6.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.6.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.6.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.6.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.60.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.60.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.60.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.60.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.60.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.60.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.61.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.61.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.61.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.61.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.61.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.61.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.62.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.62.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.62.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.62.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.62.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.62.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.63.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.63.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.63.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.63.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.63.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.63.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.64.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.64.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.64.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.64.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.64.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.64.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.65.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.65.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.65.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.65.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.65.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.65.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.66.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.66.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.66.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.66.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.66.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.66.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.67.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.67.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.67.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.67.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.67.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.67.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.68.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.68.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.68.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.68.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.68.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.68.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.69.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.69.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.69.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.69.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.69.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.69.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.7.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.7.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.7.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.7.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.7.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.7.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.70.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.70.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.70.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.70.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.70.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.70.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.71.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.71.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.71.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.71.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.71.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.71.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.72.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.72.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.72.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.72.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.72.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.72.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.73.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.73.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.73.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.73.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.73.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.73.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.74.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.74.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.74.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.74.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.74.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.74.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.75.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.75.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.75.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.75.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.75.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.75.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.76.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.76.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.76.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.76.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.76.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.76.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.77.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.77.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.77.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.77.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.77.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.77.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.78.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.78.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.78.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.78.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.78.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.78.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.79.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.79.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.79.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.79.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.79.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.79.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.8.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.8.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.8.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.8.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.8.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.8.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.80.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.80.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.80.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.80.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.80.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.80.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.81.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.81.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.81.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.81.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.81.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.81.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.82.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.82.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.82.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.82.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.82.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.82.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.83.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.83.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.83.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.83.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.83.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.83.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.84.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.84.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.84.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.84.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.84.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.84.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.85.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.85.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.85.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.85.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.85.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.85.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.86.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.86.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.86.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.86.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.86.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.86.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.87.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.87.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.87.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.87.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.87.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.87.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.88.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.88.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.88.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.88.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.88.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.88.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.89.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.89.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.89.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.89.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.89.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.89.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.9.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.9.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.9.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.9.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.9.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.9.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.90.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.90.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.90.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.90.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.90.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.90.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.91.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.91.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.91.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.91.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.91.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.91.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.92.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.92.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.92.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.92.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.92.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.92.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.93.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.93.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.93.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.93.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.93.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.93.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.94.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.94.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.94.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.94.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.94.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.94.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.95.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.95.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.95.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.95.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.95.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.95.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.96.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.96.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.96.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.96.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.96.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.96.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.97.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.97.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.97.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.97.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.97.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.97.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.98.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.98.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.98.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.98.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.98.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.98.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.99.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.99.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.99.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.99.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.99.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.experts.99.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.gate.e_score_correction_bias": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.gate.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.shared_experts.down_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.shared_experts.down_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.shared_experts.gate_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.shared_experts.gate_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.shared_experts.up_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.mlp.shared_experts.up_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.post_attention_layernorm.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.self_attn.k_norm.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.self_attn.k_proj.bias": "model-00060-of-00092.safetensors",
+ "model.layers.59.self_attn.k_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.self_attn.k_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.self_attn.o_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.self_attn.o_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.self_attn.q_norm.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.self_attn.q_proj.bias": "model-00060-of-00092.safetensors",
+ "model.layers.59.self_attn.q_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.self_attn.q_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.59.self_attn.v_proj.bias": "model-00060-of-00092.safetensors",
+ "model.layers.59.self_attn.v_proj.weight": "model-00060-of-00092.safetensors",
+ "model.layers.59.self_attn.v_proj.weight_scale": "model-00060-of-00092.safetensors",
+ "model.layers.6.input_layernorm.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.0.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.0.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.0.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.0.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.0.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.0.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.1.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.1.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.1.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.1.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.1.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.1.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.10.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.10.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.10.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.10.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.10.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.10.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.100.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.100.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.100.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.100.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.100.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.100.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.101.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.101.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.101.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.101.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.101.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.101.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.102.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.102.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.102.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.102.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.102.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.102.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.103.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.103.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.103.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.103.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.103.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.103.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.104.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.104.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.104.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.104.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.104.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.104.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.105.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.105.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.105.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.105.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.105.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.105.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.106.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.106.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.106.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.106.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.106.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.106.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.107.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.107.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.107.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.107.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.107.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.107.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.108.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.108.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.108.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.108.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.108.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.108.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.109.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.109.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.109.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.109.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.109.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.109.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.11.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.11.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.11.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.11.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.11.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.11.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.110.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.110.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.110.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.110.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.110.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.110.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.111.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.111.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.111.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.111.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.111.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.111.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.112.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.112.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.112.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.112.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.112.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.112.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.113.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.113.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.113.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.113.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.113.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.113.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.114.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.114.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.114.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.114.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.114.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.114.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.115.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.115.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.115.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.115.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.115.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.115.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.116.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.116.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.116.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.116.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.116.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.116.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.117.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.117.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.117.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.117.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.117.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.117.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.118.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.118.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.118.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.118.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.118.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.118.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.119.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.119.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.119.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.119.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.119.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.119.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.12.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.12.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.12.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.12.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.12.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.12.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.120.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.120.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.120.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.120.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.120.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.120.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.121.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.121.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.121.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.121.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.121.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.121.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.122.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.122.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.122.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.122.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.122.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.122.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.123.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.123.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.123.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.123.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.123.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.123.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.124.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.124.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.124.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.124.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.124.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.124.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.125.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.125.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.125.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.125.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.125.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.125.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.126.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.126.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.126.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.126.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.126.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.126.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.127.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.127.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.127.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.127.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.127.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.127.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.128.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.128.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.128.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.128.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.128.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.128.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.129.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.129.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.129.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.129.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.129.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.129.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.13.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.13.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.13.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.13.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.13.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.13.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.130.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.130.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.130.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.130.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.130.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.130.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.131.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.131.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.131.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.131.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.131.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.131.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.132.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.132.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.132.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.132.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.132.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.132.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.133.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.133.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.133.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.133.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.133.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.133.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.134.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.134.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.134.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.134.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.134.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.134.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.135.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.135.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.135.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.135.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.135.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.135.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.136.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.136.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.136.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.136.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.136.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.136.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.137.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.137.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.137.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.137.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.137.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.137.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.138.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.138.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.138.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.138.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.138.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.138.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.139.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.139.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.139.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.139.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.139.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.139.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.14.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.14.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.14.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.14.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.14.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.14.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.140.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.140.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.140.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.140.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.140.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.140.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.141.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.141.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.141.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.141.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.141.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.141.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.142.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.142.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.142.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.142.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.142.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.142.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.143.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.143.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.143.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.143.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.143.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.143.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.144.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.144.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.144.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.144.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.144.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.144.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.145.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.145.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.145.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.145.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.145.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.145.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.146.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.146.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.146.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.146.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.146.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.146.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.147.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.147.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.147.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.147.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.147.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.147.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.148.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.148.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.148.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.148.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.148.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.148.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.149.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.149.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.149.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.149.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.149.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.149.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.15.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.15.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.15.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.15.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.15.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.15.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.150.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.150.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.150.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.150.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.150.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.150.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.151.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.151.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.151.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.151.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.151.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.151.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.152.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.152.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.152.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.152.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.152.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.152.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.153.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.153.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.153.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.153.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.153.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.153.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.154.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.154.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.154.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.154.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.154.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.154.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.155.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.155.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.155.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.155.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.155.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.155.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.156.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.156.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.156.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.156.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.156.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.156.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.157.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.157.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.157.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.157.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.157.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.157.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.158.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.158.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.158.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.158.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.158.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.158.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.159.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.159.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.159.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.159.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.159.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.159.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.16.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.16.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.16.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.16.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.16.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.16.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.17.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.17.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.17.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.17.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.17.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.17.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.18.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.18.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.18.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.18.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.18.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.18.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.19.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.19.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.19.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.19.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.19.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.19.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.2.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.2.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.2.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.2.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.2.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.2.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.20.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.20.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.20.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.20.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.20.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.20.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.21.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.21.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.21.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.21.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.21.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.21.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.22.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.22.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.22.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.22.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.22.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.22.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.23.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.23.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.23.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.23.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.23.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.23.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.24.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.24.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.24.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.24.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.24.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.24.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.25.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.25.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.25.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.25.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.25.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.25.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.26.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.26.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.26.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.26.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.26.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.26.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.27.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.27.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.27.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.27.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.27.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.27.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.28.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.28.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.28.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.28.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.28.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.28.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.29.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.29.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.29.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.29.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.29.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.29.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.3.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.3.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.3.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.3.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.3.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.3.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.30.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.30.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.30.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.30.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.30.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.30.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.31.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.31.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.31.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.31.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.31.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.31.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.32.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.32.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.32.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.32.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.32.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.32.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.33.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.33.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.33.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.33.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.33.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.33.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.34.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.34.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.34.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.34.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.34.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.34.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.35.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.35.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.35.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.35.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.35.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.35.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.36.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.36.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.36.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.36.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.36.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.36.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.37.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.37.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.37.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.37.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.37.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.37.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.38.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.38.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.38.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.38.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.38.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.38.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.39.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.39.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.39.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.39.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.39.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.39.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.4.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.4.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.4.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.4.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.4.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.4.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.40.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.40.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.40.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.40.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.40.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.40.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.41.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.41.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.41.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.41.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.41.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.41.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.42.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.42.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.42.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.42.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.42.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.42.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.43.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.43.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.43.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.43.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.43.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.43.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.44.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.44.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.44.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.44.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.44.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.44.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.45.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.45.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.45.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.45.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.45.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.45.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.46.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.46.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.46.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.46.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.46.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.46.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.47.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.47.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.47.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.47.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.47.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.47.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.48.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.48.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.48.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.48.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.48.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.48.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.49.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.49.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.49.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.49.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.49.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.49.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.5.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.5.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.5.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.5.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.5.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.5.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.50.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.50.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.50.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.50.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.50.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.50.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.51.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.51.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.51.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.51.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.51.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.51.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.52.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.52.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.52.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.52.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.52.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.52.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.53.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.53.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.53.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.53.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.53.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.53.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.54.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.54.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.54.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.54.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.54.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.54.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.55.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.55.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.55.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.55.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.55.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.55.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.56.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.56.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.56.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.56.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.56.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.56.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.57.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.57.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.57.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.57.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.57.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.57.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.58.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.58.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.58.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.58.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.58.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.58.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.59.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.59.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.59.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.59.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.59.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.59.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.6.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.6.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.6.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.6.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.6.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.6.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.60.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.60.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.60.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.60.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.60.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.60.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.61.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.61.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.61.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.61.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.61.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.61.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.62.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.62.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.62.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.62.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.62.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.62.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.63.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.63.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.63.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.63.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.63.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.63.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.64.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.64.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.64.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.64.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.64.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.64.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.65.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.65.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.65.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.65.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.65.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.65.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.66.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.66.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.66.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.66.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.66.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.66.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.67.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.67.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.67.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.67.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.67.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.67.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.68.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.68.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.68.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.68.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.68.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.68.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.69.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.69.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.69.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.69.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.69.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.69.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.7.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.7.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.7.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.7.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.7.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.7.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.70.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.70.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.70.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.70.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.70.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.70.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.71.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.71.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.71.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.71.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.71.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.71.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.72.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.72.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.72.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.72.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.72.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.72.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.73.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.73.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.73.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.73.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.73.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.73.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.74.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.74.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.74.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.74.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.74.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.74.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.75.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.75.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.75.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.75.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.75.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.75.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.76.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.76.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.76.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.76.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.76.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.76.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.77.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.77.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.77.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.77.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.77.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.77.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.78.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.78.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.78.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.78.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.78.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.78.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.79.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.79.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.79.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.79.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.79.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.79.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.8.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.8.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.8.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.8.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.8.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.8.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.80.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.80.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.80.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.80.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.80.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.80.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.81.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.81.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.81.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.81.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.81.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.81.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.82.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.82.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.82.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.82.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.82.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.82.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.83.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.83.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.83.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.83.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.83.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.83.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.84.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.84.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.84.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.84.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.84.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.84.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.85.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.85.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.85.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.85.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.85.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.85.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.86.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.86.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.86.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.86.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.86.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.86.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.87.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.87.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.87.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.87.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.87.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.87.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.88.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.88.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.88.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.88.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.88.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.88.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.89.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.89.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.89.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.89.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.89.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.89.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.9.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.9.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.9.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.9.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.9.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.9.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.90.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.90.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.90.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.90.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.90.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.90.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.91.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.91.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.91.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.91.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.91.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.91.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.92.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.92.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.92.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.92.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.92.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.92.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.93.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.93.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.93.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.93.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.93.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.93.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.94.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.94.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.94.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.94.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.94.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.94.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.95.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.95.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.95.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.95.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.95.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.95.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.96.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.96.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.96.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.96.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.96.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.96.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.97.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.97.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.97.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.97.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.97.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.97.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.98.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.98.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.98.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.98.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.98.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.98.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.99.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.99.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.99.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.99.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.99.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.experts.99.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.gate.e_score_correction_bias": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.gate.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.shared_experts.down_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.shared_experts.down_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.shared_experts.gate_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.shared_experts.gate_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.shared_experts.up_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.mlp.shared_experts.up_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.post_attention_layernorm.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.self_attn.k_norm.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.self_attn.k_proj.bias": "model-00007-of-00092.safetensors",
+ "model.layers.6.self_attn.k_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.self_attn.k_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.self_attn.o_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.self_attn.o_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.self_attn.q_norm.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.self_attn.q_proj.bias": "model-00007-of-00092.safetensors",
+ "model.layers.6.self_attn.q_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.self_attn.q_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.6.self_attn.v_proj.bias": "model-00007-of-00092.safetensors",
+ "model.layers.6.self_attn.v_proj.weight": "model-00007-of-00092.safetensors",
+ "model.layers.6.self_attn.v_proj.weight_scale": "model-00007-of-00092.safetensors",
+ "model.layers.60.input_layernorm.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.0.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.0.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.0.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.0.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.0.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.0.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.1.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.1.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.1.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.1.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.1.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.1.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.10.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.10.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.10.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.10.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.10.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.10.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.100.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.100.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.100.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.100.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.100.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.100.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.101.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.101.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.101.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.101.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.101.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.101.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.102.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.102.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.102.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.102.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.102.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.102.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.103.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.103.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.103.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.103.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.103.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.103.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.104.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.104.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.104.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.104.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.104.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.104.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.105.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.105.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.105.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.105.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.105.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.105.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.106.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.106.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.106.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.106.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.106.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.106.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.107.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.107.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.107.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.107.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.107.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.107.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.108.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.108.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.108.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.108.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.108.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.108.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.109.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.109.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.109.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.109.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.109.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.109.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.11.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.11.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.11.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.11.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.11.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.11.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.110.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.110.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.110.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.110.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.110.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.110.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.111.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.111.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.111.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.111.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.111.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.111.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.112.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.112.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.112.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.112.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.112.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.112.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.113.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.113.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.113.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.113.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.113.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.113.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.114.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.114.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.114.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.114.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.114.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.114.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.115.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.115.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.115.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.115.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.115.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.115.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.116.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.116.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.116.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.116.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.116.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.116.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.117.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.117.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.117.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.117.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.117.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.117.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.118.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.118.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.118.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.118.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.118.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.118.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.119.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.119.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.119.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.119.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.119.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.119.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.12.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.12.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.12.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.12.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.12.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.12.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.120.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.120.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.120.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.120.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.120.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.120.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.121.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.121.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.121.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.121.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.121.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.121.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.122.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.122.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.122.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.122.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.122.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.122.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.123.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.123.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.123.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.123.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.123.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.123.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.124.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.124.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.124.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.124.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.124.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.124.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.125.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.125.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.125.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.125.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.125.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.125.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.126.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.126.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.126.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.126.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.126.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.126.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.127.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.127.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.127.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.127.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.127.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.127.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.128.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.128.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.128.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.128.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.128.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.128.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.129.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.129.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.129.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.129.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.129.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.129.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.13.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.13.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.13.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.13.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.13.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.13.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.130.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.130.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.130.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.130.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.130.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.130.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.131.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.131.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.131.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.131.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.131.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.131.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.132.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.132.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.132.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.132.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.132.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.132.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.133.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.133.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.133.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.133.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.133.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.133.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.134.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.134.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.134.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.134.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.134.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.134.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.135.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.135.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.135.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.135.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.135.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.135.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.136.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.136.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.136.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.136.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.136.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.136.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.137.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.137.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.137.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.137.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.137.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.137.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.138.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.138.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.138.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.138.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.138.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.138.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.139.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.139.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.139.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.139.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.139.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.139.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.14.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.14.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.14.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.14.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.14.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.14.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.140.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.140.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.140.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.140.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.140.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.140.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.141.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.141.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.141.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.141.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.141.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.141.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.142.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.142.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.142.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.142.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.142.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.142.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.143.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.143.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.143.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.143.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.143.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.143.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.144.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.144.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.144.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.144.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.144.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.144.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.145.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.145.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.145.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.145.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.145.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.145.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.146.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.146.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.146.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.146.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.146.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.146.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.147.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.147.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.147.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.147.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.147.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.147.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.148.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.148.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.148.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.148.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.148.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.148.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.149.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.149.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.149.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.149.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.149.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.149.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.15.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.15.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.15.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.15.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.15.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.15.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.150.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.150.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.150.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.150.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.150.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.150.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.151.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.151.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.151.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.151.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.151.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.151.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.152.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.152.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.152.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.152.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.152.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.152.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.153.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.153.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.153.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.153.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.153.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.153.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.154.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.154.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.154.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.154.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.154.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.154.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.155.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.155.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.155.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.155.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.155.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.155.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.156.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.156.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.156.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.156.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.156.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.156.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.157.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.157.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.157.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.157.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.157.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.157.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.158.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.158.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.158.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.158.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.158.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.158.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.159.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.159.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.159.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.159.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.159.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.159.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.16.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.16.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.16.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.16.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.16.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.16.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.17.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.17.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.17.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.17.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.17.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.17.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.18.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.18.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.18.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.18.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.18.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.18.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.19.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.19.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.19.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.19.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.19.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.19.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.2.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.2.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.2.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.2.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.2.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.2.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.20.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.20.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.20.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.20.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.20.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.20.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.21.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.21.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.21.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.21.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.21.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.21.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.22.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.22.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.22.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.22.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.22.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.22.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.23.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.23.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.23.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.23.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.23.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.23.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.24.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.24.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.24.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.24.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.24.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.24.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.25.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.25.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.25.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.25.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.25.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.25.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.26.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.26.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.26.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.26.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.26.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.26.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.27.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.27.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.27.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.27.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.27.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.27.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.28.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.28.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.28.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.28.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.28.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.28.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.29.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.29.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.29.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.29.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.29.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.29.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.3.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.3.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.3.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.3.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.3.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.3.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.30.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.30.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.30.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.30.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.30.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.30.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.31.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.31.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.31.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.31.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.31.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.31.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.32.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.32.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.32.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.32.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.32.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.32.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.33.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.33.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.33.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.33.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.33.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.33.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.34.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.34.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.34.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.34.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.34.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.34.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.35.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.35.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.35.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.35.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.35.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.35.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.36.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.36.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.36.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.36.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.36.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.36.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.37.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.37.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.37.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.37.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.37.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.37.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.38.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.38.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.38.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.38.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.38.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.38.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.39.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.39.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.39.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.39.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.39.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.39.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.4.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.4.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.4.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.4.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.4.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.4.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.40.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.40.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.40.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.40.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.40.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.40.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.41.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.41.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.41.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.41.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.41.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.41.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.42.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.42.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.42.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.42.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.42.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.42.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.43.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.43.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.43.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.43.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.43.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.43.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.44.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.44.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.44.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.44.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.44.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.44.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.45.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.45.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.45.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.45.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.45.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.45.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.46.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.46.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.46.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.46.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.46.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.46.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.47.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.47.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.47.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.47.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.47.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.47.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.48.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.48.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.48.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.48.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.48.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.48.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.49.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.49.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.49.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.49.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.49.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.49.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.5.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.5.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.5.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.5.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.5.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.5.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.50.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.50.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.50.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.50.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.50.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.50.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.51.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.51.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.51.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.51.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.51.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.51.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.52.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.52.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.52.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.52.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.52.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.52.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.53.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.53.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.53.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.53.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.53.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.53.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.54.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.54.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.54.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.54.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.54.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.54.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.55.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.55.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.55.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.55.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.55.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.55.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.56.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.56.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.56.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.56.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.56.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.56.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.57.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.57.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.57.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.57.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.57.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.57.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.58.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.58.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.58.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.58.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.58.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.58.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.59.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.59.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.59.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.59.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.59.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.59.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.6.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.6.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.6.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.6.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.6.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.6.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.60.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.60.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.60.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.60.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.60.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.60.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.61.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.61.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.61.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.61.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.61.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.61.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.62.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.62.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.62.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.62.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.62.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.62.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.63.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.63.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.63.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.63.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.63.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.63.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.64.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.64.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.64.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.64.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.64.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.64.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.65.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.65.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.65.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.65.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.65.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.65.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.66.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.66.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.66.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.66.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.66.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.66.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.67.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.67.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.67.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.67.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.67.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.67.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.68.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.68.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.68.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.68.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.68.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.68.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.69.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.69.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.69.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.69.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.69.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.69.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.7.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.7.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.7.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.7.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.7.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.7.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.70.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.70.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.70.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.70.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.70.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.70.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.71.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.71.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.71.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.71.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.71.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.71.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.72.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.72.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.72.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.72.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.72.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.72.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.73.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.73.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.73.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.73.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.73.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.73.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.74.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.74.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.74.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.74.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.74.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.74.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.75.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.75.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.75.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.75.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.75.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.75.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.76.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.76.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.76.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.76.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.76.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.76.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.77.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.77.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.77.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.77.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.77.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.77.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.78.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.78.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.78.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.78.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.78.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.78.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.79.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.79.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.79.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.79.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.79.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.79.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.8.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.8.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.8.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.8.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.8.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.8.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.80.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.80.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.80.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.80.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.80.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.80.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.81.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.81.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.81.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.81.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.81.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.81.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.82.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.82.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.82.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.82.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.82.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.82.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.83.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.83.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.83.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.83.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.83.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.83.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.84.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.84.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.84.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.84.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.84.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.84.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.85.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.85.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.85.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.85.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.85.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.85.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.86.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.86.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.86.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.86.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.86.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.86.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.87.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.87.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.87.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.87.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.87.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.87.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.88.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.88.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.88.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.88.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.88.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.88.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.89.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.89.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.89.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.89.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.89.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.89.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.9.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.9.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.9.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.9.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.9.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.9.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.90.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.90.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.90.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.90.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.90.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.90.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.91.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.91.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.91.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.91.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.91.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.91.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.92.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.92.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.92.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.92.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.92.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.92.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.93.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.93.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.93.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.93.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.93.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.93.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.94.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.94.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.94.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.94.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.94.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.94.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.95.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.95.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.95.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.95.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.95.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.95.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.96.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.96.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.96.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.96.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.96.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.96.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.97.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.97.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.97.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.97.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.97.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.97.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.98.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.98.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.98.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.98.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.98.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.98.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.99.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.99.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.99.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.99.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.99.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.experts.99.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.gate.e_score_correction_bias": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.gate.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.shared_experts.down_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.shared_experts.down_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.shared_experts.gate_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.shared_experts.gate_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.shared_experts.up_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.mlp.shared_experts.up_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.post_attention_layernorm.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.self_attn.k_norm.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.self_attn.k_proj.bias": "model-00061-of-00092.safetensors",
+ "model.layers.60.self_attn.k_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.self_attn.k_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.self_attn.o_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.self_attn.o_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.self_attn.q_norm.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.self_attn.q_proj.bias": "model-00061-of-00092.safetensors",
+ "model.layers.60.self_attn.q_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.self_attn.q_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.60.self_attn.v_proj.bias": "model-00061-of-00092.safetensors",
+ "model.layers.60.self_attn.v_proj.weight": "model-00061-of-00092.safetensors",
+ "model.layers.60.self_attn.v_proj.weight_scale": "model-00061-of-00092.safetensors",
+ "model.layers.61.input_layernorm.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.0.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.0.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.0.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.0.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.0.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.0.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.1.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.1.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.1.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.1.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.1.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.1.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.10.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.10.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.10.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.10.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.10.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.10.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.100.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.100.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.100.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.100.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.100.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.100.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.101.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.101.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.101.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.101.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.101.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.101.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.102.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.102.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.102.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.102.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.102.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.102.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.103.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.103.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.103.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.103.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.103.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.103.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.104.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.104.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.104.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.104.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.104.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.104.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.105.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.105.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.105.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.105.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.105.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.105.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.106.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.106.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.106.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.106.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.106.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.106.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.107.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.107.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.107.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.107.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.107.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.107.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.108.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.108.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.108.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.108.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.108.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.108.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.109.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.109.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.109.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.109.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.109.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.109.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.11.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.11.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.11.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.11.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.11.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.11.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.110.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.110.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.110.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.110.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.110.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.110.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.111.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.111.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.111.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.111.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.111.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.111.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.112.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.112.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.112.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.112.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.112.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.112.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.113.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.113.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.113.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.113.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.113.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.113.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.114.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.114.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.114.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.114.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.114.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.114.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.115.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.115.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.115.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.115.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.115.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.115.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.116.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.116.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.116.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.116.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.116.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.116.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.117.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.117.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.117.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.117.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.117.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.117.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.118.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.118.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.118.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.118.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.118.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.118.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.119.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.119.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.119.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.119.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.119.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.119.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.12.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.12.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.12.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.12.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.12.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.12.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.120.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.120.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.120.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.120.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.120.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.120.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.121.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.121.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.121.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.121.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.121.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.121.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.122.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.122.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.122.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.122.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.122.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.122.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.123.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.123.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.123.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.123.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.123.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.123.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.124.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.124.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.124.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.124.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.124.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.124.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.125.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.125.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.125.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.125.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.125.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.125.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.126.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.126.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.126.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.126.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.126.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.126.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.127.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.127.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.127.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.127.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.127.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.127.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.128.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.128.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.128.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.128.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.128.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.128.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.129.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.129.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.129.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.129.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.129.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.129.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.13.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.13.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.13.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.13.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.13.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.13.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.130.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.130.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.130.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.130.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.130.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.130.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.131.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.131.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.131.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.131.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.131.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.131.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.132.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.132.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.132.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.132.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.132.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.132.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.133.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.133.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.133.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.133.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.133.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.133.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.134.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.134.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.134.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.134.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.134.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.134.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.135.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.135.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.135.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.135.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.135.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.135.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.136.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.136.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.136.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.136.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.136.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.136.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.137.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.137.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.137.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.137.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.137.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.137.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.138.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.138.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.138.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.138.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.138.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.138.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.139.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.139.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.139.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.139.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.139.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.139.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.14.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.14.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.14.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.14.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.14.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.14.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.140.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.140.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.140.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.140.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.140.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.140.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.141.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.141.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.141.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.141.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.141.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.141.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.142.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.142.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.142.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.142.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.142.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.142.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.143.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.143.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.143.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.143.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.143.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.143.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.144.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.144.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.144.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.144.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.144.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.144.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.145.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.145.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.145.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.145.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.145.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.145.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.146.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.146.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.146.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.146.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.146.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.146.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.147.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.147.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.147.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.147.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.147.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.147.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.148.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.148.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.148.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.148.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.148.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.148.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.149.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.149.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.149.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.149.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.149.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.149.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.15.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.15.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.15.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.15.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.15.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.15.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.150.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.150.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.150.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.150.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.150.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.150.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.151.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.151.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.151.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.151.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.151.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.151.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.152.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.152.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.152.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.152.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.152.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.152.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.153.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.153.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.153.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.153.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.153.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.153.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.154.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.154.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.154.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.154.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.154.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.154.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.155.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.155.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.155.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.155.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.155.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.155.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.156.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.156.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.156.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.156.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.156.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.156.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.157.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.157.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.157.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.157.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.157.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.157.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.158.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.158.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.158.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.158.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.158.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.158.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.159.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.159.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.159.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.159.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.159.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.159.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.16.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.16.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.16.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.16.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.16.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.16.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.17.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.17.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.17.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.17.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.17.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.17.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.18.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.18.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.18.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.18.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.18.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.18.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.19.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.19.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.19.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.19.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.19.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.19.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.2.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.2.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.2.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.2.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.2.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.2.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.20.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.20.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.20.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.20.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.20.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.20.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.21.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.21.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.21.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.21.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.21.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.21.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.22.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.22.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.22.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.22.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.22.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.22.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.23.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.23.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.23.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.23.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.23.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.23.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.24.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.24.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.24.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.24.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.24.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.24.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.25.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.25.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.25.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.25.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.25.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.25.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.26.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.26.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.26.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.26.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.26.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.26.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.27.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.27.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.27.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.27.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.27.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.27.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.28.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.28.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.28.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.28.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.28.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.28.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.29.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.29.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.29.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.29.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.29.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.29.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.3.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.3.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.3.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.3.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.3.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.3.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.30.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.30.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.30.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.30.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.30.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.30.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.31.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.31.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.31.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.31.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.31.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.31.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.32.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.32.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.32.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.32.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.32.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.32.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.33.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.33.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.33.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.33.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.33.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.33.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.34.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.34.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.34.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.34.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.34.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.34.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.35.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.35.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.35.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.35.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.35.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.35.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.36.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.36.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.36.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.36.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.36.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.36.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.37.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.37.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.37.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.37.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.37.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.37.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.38.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.38.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.38.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.38.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.38.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.38.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.39.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.39.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.39.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.39.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.39.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.39.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.4.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.4.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.4.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.4.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.4.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.4.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.40.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.40.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.40.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.40.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.40.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.40.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.41.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.41.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.41.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.41.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.41.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.41.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.42.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.42.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.42.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.42.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.42.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.42.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.43.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.43.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.43.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.43.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.43.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.43.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.44.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.44.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.44.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.44.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.44.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.44.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.45.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.45.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.45.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.45.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.45.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.45.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.46.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.46.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.46.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.46.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.46.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.46.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.47.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.47.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.47.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.47.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.47.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.47.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.48.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.48.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.48.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.48.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.48.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.48.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.49.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.49.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.49.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.49.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.49.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.49.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.5.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.5.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.5.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.5.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.5.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.5.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.50.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.50.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.50.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.50.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.50.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.50.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.51.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.51.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.51.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.51.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.51.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.51.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.52.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.52.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.52.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.52.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.52.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.52.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.53.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.53.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.53.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.53.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.53.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.53.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.54.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.54.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.54.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.54.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.54.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.54.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.55.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.55.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.55.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.55.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.55.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.55.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.56.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.56.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.56.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.56.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.56.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.56.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.57.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.57.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.57.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.57.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.57.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.57.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.58.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.58.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.58.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.58.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.58.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.58.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.59.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.59.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.59.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.59.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.59.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.59.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.6.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.6.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.6.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.6.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.6.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.6.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.60.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.60.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.60.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.60.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.60.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.60.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.61.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.61.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.61.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.61.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.61.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.61.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.62.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.62.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.62.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.62.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.62.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.62.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.63.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.63.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.63.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.63.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.63.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.63.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.64.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.64.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.64.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.64.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.64.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.64.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.65.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.65.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.65.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.65.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.65.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.65.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.66.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.66.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.66.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.66.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.66.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.66.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.67.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.67.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.67.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.67.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.67.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.67.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.68.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.68.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.68.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.68.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.68.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.68.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.69.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.69.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.69.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.69.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.69.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.69.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.7.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.7.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.7.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.7.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.7.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.7.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.70.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.70.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.70.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.70.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.70.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.70.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.71.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.71.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.71.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.71.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.71.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.71.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.72.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.72.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.72.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.72.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.72.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.72.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.73.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.73.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.73.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.73.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.73.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.73.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.74.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.74.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.74.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.74.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.74.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.74.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.75.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.75.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.75.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.75.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.75.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.75.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.76.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.76.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.76.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.76.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.76.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.76.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.77.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.77.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.77.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.77.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.77.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.77.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.78.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.78.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.78.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.78.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.78.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.78.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.79.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.79.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.79.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.79.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.79.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.79.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.8.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.8.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.8.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.8.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.8.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.8.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.80.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.80.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.80.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.80.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.80.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.80.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.81.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.81.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.81.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.81.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.81.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.81.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.82.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.82.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.82.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.82.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.82.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.82.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.83.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.83.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.83.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.83.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.83.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.83.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.84.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.84.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.84.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.84.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.84.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.84.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.85.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.85.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.85.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.85.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.85.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.85.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.86.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.86.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.86.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.86.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.86.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.86.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.87.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.87.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.87.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.87.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.87.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.87.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.88.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.88.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.88.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.88.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.88.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.88.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.89.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.89.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.89.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.89.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.89.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.89.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.9.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.9.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.9.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.9.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.9.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.9.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.90.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.90.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.90.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.90.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.90.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.90.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.91.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.91.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.91.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.91.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.91.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.91.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.92.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.92.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.92.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.92.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.92.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.92.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.93.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.93.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.93.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.93.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.93.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.93.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.94.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.94.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.94.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.94.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.94.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.94.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.95.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.95.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.95.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.95.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.95.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.95.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.96.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.96.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.96.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.96.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.96.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.96.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.97.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.97.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.97.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.97.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.97.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.97.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.98.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.98.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.98.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.98.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.98.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.98.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.99.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.99.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.99.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.99.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.99.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.experts.99.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.gate.e_score_correction_bias": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.gate.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.shared_experts.down_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.shared_experts.down_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.shared_experts.gate_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.shared_experts.gate_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.shared_experts.up_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.mlp.shared_experts.up_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.post_attention_layernorm.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.self_attn.k_norm.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.self_attn.k_proj.bias": "model-00062-of-00092.safetensors",
+ "model.layers.61.self_attn.k_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.self_attn.k_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.self_attn.o_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.self_attn.o_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.self_attn.q_norm.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.self_attn.q_proj.bias": "model-00062-of-00092.safetensors",
+ "model.layers.61.self_attn.q_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.self_attn.q_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.61.self_attn.v_proj.bias": "model-00062-of-00092.safetensors",
+ "model.layers.61.self_attn.v_proj.weight": "model-00062-of-00092.safetensors",
+ "model.layers.61.self_attn.v_proj.weight_scale": "model-00062-of-00092.safetensors",
+ "model.layers.62.input_layernorm.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.0.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.0.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.0.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.0.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.0.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.0.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.1.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.1.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.1.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.1.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.1.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.1.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.10.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.10.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.10.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.10.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.10.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.10.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.100.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.100.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.100.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.100.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.100.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.100.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.101.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.101.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.101.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.101.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.101.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.101.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.102.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.102.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.102.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.102.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.102.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.102.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.103.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.103.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.103.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.103.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.103.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.103.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.104.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.104.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.104.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.104.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.104.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.104.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.105.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.105.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.105.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.105.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.105.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.105.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.106.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.106.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.106.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.106.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.106.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.106.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.107.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.107.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.107.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.107.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.107.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.107.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.108.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.108.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.108.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.108.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.108.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.108.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.109.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.109.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.109.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.109.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.109.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.109.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.11.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.11.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.11.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.11.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.11.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.11.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.110.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.110.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.110.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.110.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.110.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.110.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.111.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.111.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.111.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.111.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.111.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.111.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.112.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.112.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.112.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.112.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.112.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.112.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.113.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.113.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.113.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.113.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.113.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.113.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.114.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.114.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.114.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.114.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.114.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.114.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.115.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.115.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.115.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.115.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.115.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.115.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.116.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.116.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.116.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.116.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.116.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.116.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.117.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.117.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.117.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.117.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.117.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.117.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.118.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.118.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.118.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.118.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.118.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.118.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.119.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.119.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.119.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.119.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.119.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.119.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.12.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.12.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.12.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.12.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.12.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.12.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.120.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.120.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.120.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.120.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.120.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.120.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.121.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.121.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.121.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.121.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.121.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.121.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.122.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.122.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.122.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.122.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.122.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.122.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.123.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.123.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.123.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.123.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.123.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.123.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.124.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.124.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.124.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.124.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.124.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.124.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.125.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.125.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.125.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.125.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.125.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.125.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.126.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.126.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.126.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.126.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.126.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.126.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.127.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.127.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.127.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.127.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.127.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.127.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.128.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.128.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.128.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.128.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.128.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.128.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.129.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.129.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.129.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.129.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.129.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.129.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.13.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.13.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.13.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.13.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.13.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.13.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.130.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.130.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.130.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.130.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.130.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.130.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.131.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.131.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.131.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.131.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.131.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.131.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.132.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.132.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.132.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.132.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.132.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.132.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.133.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.133.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.133.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.133.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.133.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.133.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.134.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.134.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.134.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.134.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.134.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.134.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.135.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.135.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.135.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.135.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.135.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.135.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.136.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.136.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.136.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.136.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.136.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.136.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.137.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.137.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.137.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.137.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.137.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.137.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.138.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.138.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.138.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.138.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.138.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.138.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.139.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.139.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.139.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.139.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.139.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.139.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.14.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.14.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.14.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.14.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.14.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.14.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.140.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.140.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.140.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.140.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.140.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.140.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.141.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.141.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.141.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.141.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.141.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.141.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.142.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.142.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.142.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.142.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.142.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.142.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.143.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.143.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.143.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.143.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.143.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.143.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.144.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.144.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.144.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.144.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.144.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.144.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.145.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.145.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.145.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.145.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.145.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.145.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.146.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.146.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.146.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.146.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.146.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.146.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.147.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.147.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.147.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.147.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.147.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.147.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.148.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.148.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.148.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.148.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.148.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.148.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.149.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.149.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.149.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.149.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.149.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.149.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.15.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.15.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.15.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.15.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.15.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.15.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.150.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.150.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.150.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.150.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.150.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.150.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.151.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.151.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.151.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.151.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.151.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.151.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.152.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.152.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.152.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.152.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.152.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.152.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.153.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.153.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.153.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.153.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.153.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.153.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.154.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.154.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.154.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.154.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.154.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.154.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.155.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.155.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.155.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.155.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.155.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.155.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.156.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.156.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.156.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.156.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.156.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.156.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.157.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.157.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.157.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.157.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.157.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.157.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.158.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.158.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.158.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.158.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.158.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.158.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.159.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.159.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.159.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.159.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.159.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.159.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.16.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.16.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.16.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.16.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.16.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.16.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.17.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.17.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.17.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.17.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.17.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.17.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.18.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.18.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.18.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.18.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.18.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.18.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.19.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.19.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.19.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.19.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.19.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.19.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.2.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.2.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.2.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.2.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.2.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.2.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.20.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.20.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.20.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.20.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.20.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.20.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.21.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.21.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.21.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.21.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.21.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.21.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.22.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.22.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.22.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.22.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.22.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.22.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.23.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.23.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.23.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.23.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.23.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.23.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.24.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.24.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.24.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.24.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.24.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.24.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.25.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.25.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.25.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.25.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.25.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.25.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.26.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.26.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.26.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.26.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.26.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.26.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.27.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.27.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.27.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.27.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.27.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.27.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.28.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.28.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.28.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.28.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.28.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.28.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.29.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.29.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.29.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.29.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.29.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.29.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.3.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.3.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.3.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.3.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.3.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.3.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.30.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.30.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.30.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.30.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.30.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.30.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.31.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.31.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.31.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.31.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.31.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.31.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.32.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.32.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.32.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.32.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.32.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.32.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.33.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.33.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.33.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.33.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.33.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.33.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.34.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.34.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.34.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.34.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.34.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.34.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.35.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.35.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.35.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.35.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.35.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.35.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.36.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.36.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.36.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.36.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.36.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.36.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.37.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.37.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.37.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.37.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.37.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.37.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.38.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.38.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.38.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.38.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.38.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.38.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.39.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.39.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.39.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.39.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.39.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.39.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.4.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.4.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.4.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.4.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.4.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.4.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.40.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.40.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.40.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.40.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.40.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.40.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.41.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.41.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.41.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.41.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.41.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.41.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.42.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.42.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.42.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.42.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.42.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.42.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.43.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.43.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.43.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.43.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.43.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.43.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.44.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.44.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.44.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.44.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.44.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.44.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.45.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.45.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.45.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.45.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.45.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.45.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.46.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.46.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.46.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.46.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.46.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.46.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.47.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.47.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.47.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.47.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.47.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.47.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.48.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.48.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.48.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.48.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.48.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.48.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.49.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.49.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.49.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.49.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.49.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.49.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.5.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.5.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.5.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.5.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.5.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.5.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.50.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.50.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.50.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.50.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.50.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.50.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.51.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.51.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.51.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.51.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.51.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.51.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.52.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.52.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.52.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.52.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.52.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.52.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.53.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.53.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.53.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.53.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.53.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.53.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.54.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.54.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.54.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.54.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.54.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.54.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.55.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.55.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.55.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.55.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.55.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.55.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.56.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.56.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.56.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.56.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.56.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.56.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.57.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.57.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.57.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.57.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.57.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.57.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.58.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.58.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.58.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.58.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.58.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.58.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.59.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.59.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.59.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.59.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.59.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.59.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.6.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.6.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.6.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.6.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.6.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.6.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.60.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.60.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.60.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.60.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.60.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.60.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.61.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.61.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.61.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.61.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.61.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.61.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.62.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.62.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.62.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.62.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.62.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.62.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.63.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.63.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.63.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.63.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.63.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.63.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.64.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.64.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.64.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.64.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.64.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.64.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.65.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.65.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.65.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.65.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.65.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.65.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.66.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.66.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.66.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.66.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.66.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.66.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.67.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.67.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.67.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.67.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.67.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.67.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.68.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.68.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.68.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.68.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.68.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.68.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.69.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.69.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.69.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.69.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.69.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.69.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.7.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.7.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.7.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.7.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.7.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.7.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.70.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.70.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.70.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.70.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.70.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.70.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.71.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.71.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.71.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.71.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.71.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.71.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.72.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.72.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.72.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.72.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.72.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.72.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.73.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.73.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.73.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.73.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.73.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.73.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.74.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.74.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.74.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.74.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.74.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.74.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.75.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.75.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.75.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.75.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.75.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.75.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.76.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.76.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.76.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.76.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.76.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.76.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.77.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.77.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.77.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.77.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.77.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.77.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.78.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.78.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.78.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.78.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.78.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.78.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.79.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.79.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.79.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.79.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.79.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.79.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.8.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.8.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.8.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.8.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.8.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.8.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.80.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.80.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.80.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.80.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.80.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.80.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.81.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.81.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.81.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.81.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.81.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.81.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.82.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.82.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.82.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.82.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.82.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.82.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.83.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.83.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.83.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.83.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.83.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.83.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.84.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.84.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.84.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.84.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.84.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.84.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.85.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.85.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.85.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.85.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.85.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.85.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.86.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.86.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.86.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.86.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.86.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.86.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.87.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.87.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.87.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.87.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.87.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.87.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.88.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.88.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.88.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.88.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.88.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.88.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.89.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.89.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.89.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.89.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.89.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.89.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.9.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.9.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.9.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.9.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.9.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.9.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.90.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.90.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.90.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.90.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.90.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.90.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.91.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.91.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.91.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.91.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.91.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.91.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.92.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.92.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.92.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.92.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.92.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.92.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.93.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.93.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.93.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.93.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.93.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.93.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.94.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.94.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.94.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.94.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.94.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.94.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.95.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.95.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.95.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.95.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.95.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.95.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.96.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.96.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.96.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.96.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.96.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.96.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.97.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.97.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.97.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.97.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.97.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.97.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.98.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.98.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.98.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.98.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.98.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.98.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.99.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.99.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.99.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.99.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.99.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.experts.99.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.gate.e_score_correction_bias": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.gate.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.shared_experts.down_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.shared_experts.down_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.shared_experts.gate_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.shared_experts.gate_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.shared_experts.up_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.mlp.shared_experts.up_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.post_attention_layernorm.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.self_attn.k_norm.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.self_attn.k_proj.bias": "model-00063-of-00092.safetensors",
+ "model.layers.62.self_attn.k_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.self_attn.k_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.self_attn.o_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.self_attn.o_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.self_attn.q_norm.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.self_attn.q_proj.bias": "model-00063-of-00092.safetensors",
+ "model.layers.62.self_attn.q_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.self_attn.q_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.62.self_attn.v_proj.bias": "model-00063-of-00092.safetensors",
+ "model.layers.62.self_attn.v_proj.weight": "model-00063-of-00092.safetensors",
+ "model.layers.62.self_attn.v_proj.weight_scale": "model-00063-of-00092.safetensors",
+ "model.layers.63.input_layernorm.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.0.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.0.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.0.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.0.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.0.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.0.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.1.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.1.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.1.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.1.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.1.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.1.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.10.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.10.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.10.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.10.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.10.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.10.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.100.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.100.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.100.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.100.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.100.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.100.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.101.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.101.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.101.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.101.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.101.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.101.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.102.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.102.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.102.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.102.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.102.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.102.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.103.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.103.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.103.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.103.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.103.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.103.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.104.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.104.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.104.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.104.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.104.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.104.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.105.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.105.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.105.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.105.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.105.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.105.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.106.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.106.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.106.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.106.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.106.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.106.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.107.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.107.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.107.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.107.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.107.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.107.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.108.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.108.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.108.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.108.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.108.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.108.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.109.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.109.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.109.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.109.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.109.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.109.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.11.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.11.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.11.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.11.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.11.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.11.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.110.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.110.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.110.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.110.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.110.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.110.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.111.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.111.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.111.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.111.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.111.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.111.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.112.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.112.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.112.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.112.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.112.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.112.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.113.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.113.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.113.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.113.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.113.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.113.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.114.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.114.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.114.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.114.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.114.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.114.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.115.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.115.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.115.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.115.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.115.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.115.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.116.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.116.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.116.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.116.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.116.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.116.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.117.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.117.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.117.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.117.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.117.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.117.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.118.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.118.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.118.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.118.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.118.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.118.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.119.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.119.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.119.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.119.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.119.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.119.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.12.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.12.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.12.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.12.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.12.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.12.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.120.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.120.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.120.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.120.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.120.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.120.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.121.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.121.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.121.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.121.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.121.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.121.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.122.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.122.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.122.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.122.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.122.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.122.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.123.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.123.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.123.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.123.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.123.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.123.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.124.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.124.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.124.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.124.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.124.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.124.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.125.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.125.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.125.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.125.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.125.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.125.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.126.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.126.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.126.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.126.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.126.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.126.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.127.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.127.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.127.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.127.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.127.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.127.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.128.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.128.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.128.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.128.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.128.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.128.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.129.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.129.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.129.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.129.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.129.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.129.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.13.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.13.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.13.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.13.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.13.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.13.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.130.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.130.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.130.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.130.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.130.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.130.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.131.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.131.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.131.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.131.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.131.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.131.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.132.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.132.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.132.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.132.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.132.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.132.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.133.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.133.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.133.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.133.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.133.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.133.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.134.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.134.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.134.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.134.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.134.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.134.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.135.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.135.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.135.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.135.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.135.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.135.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.136.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.136.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.136.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.136.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.136.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.136.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.137.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.137.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.137.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.137.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.137.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.137.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.138.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.138.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.138.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.138.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.138.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.138.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.139.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.139.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.139.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.139.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.139.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.139.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.14.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.14.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.14.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.14.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.14.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.14.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.140.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.140.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.140.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.140.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.140.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.140.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.141.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.141.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.141.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.141.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.141.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.141.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.142.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.142.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.142.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.142.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.142.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.142.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.143.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.143.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.143.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.143.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.143.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.143.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.144.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.144.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.144.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.144.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.144.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.144.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.145.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.145.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.145.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.145.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.145.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.145.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.146.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.146.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.146.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.146.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.146.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.146.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.147.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.147.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.147.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.147.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.147.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.147.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.148.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.148.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.148.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.148.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.148.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.148.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.149.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.149.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.149.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.149.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.149.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.149.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.15.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.15.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.15.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.15.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.15.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.15.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.150.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.150.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.150.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.150.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.150.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.150.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.151.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.151.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.151.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.151.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.151.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.151.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.152.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.152.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.152.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.152.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.152.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.152.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.153.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.153.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.153.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.153.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.153.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.153.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.154.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.154.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.154.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.154.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.154.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.154.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.155.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.155.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.155.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.155.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.155.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.155.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.156.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.156.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.156.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.156.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.156.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.156.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.157.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.157.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.157.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.157.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.157.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.157.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.158.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.158.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.158.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.158.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.158.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.158.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.159.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.159.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.159.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.159.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.159.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.159.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.16.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.16.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.16.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.16.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.16.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.16.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.17.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.17.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.17.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.17.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.17.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.17.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.18.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.18.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.18.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.18.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.18.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.18.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.19.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.19.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.19.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.19.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.19.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.19.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.2.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.2.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.2.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.2.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.2.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.2.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.20.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.20.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.20.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.20.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.20.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.20.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.21.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.21.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.21.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.21.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.21.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.21.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.22.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.22.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.22.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.22.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.22.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.22.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.23.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.23.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.23.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.23.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.23.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.23.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.24.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.24.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.24.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.24.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.24.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.24.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.25.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.25.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.25.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.25.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.25.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.25.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.26.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.26.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.26.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.26.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.26.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.26.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.27.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.27.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.27.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.27.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.27.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.27.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.28.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.28.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.28.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.28.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.28.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.28.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.29.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.29.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.29.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.29.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.29.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.29.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.3.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.3.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.3.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.3.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.3.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.3.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.30.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.30.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.30.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.30.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.30.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.30.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.31.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.31.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.31.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.31.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.31.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.31.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.32.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.32.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.32.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.32.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.32.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.32.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.33.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.33.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.33.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.33.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.33.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.33.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.34.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.34.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.34.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.34.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.34.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.34.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.35.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.35.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.35.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.35.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.35.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.35.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.36.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.36.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.36.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.36.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.36.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.36.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.37.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.37.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.37.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.37.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.37.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.37.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.38.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.38.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.38.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.38.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.38.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.38.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.39.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.39.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.39.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.39.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.39.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.39.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.4.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.4.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.4.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.4.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.4.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.4.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.40.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.40.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.40.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.40.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.40.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.40.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.41.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.41.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.41.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.41.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.41.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.41.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.42.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.42.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.42.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.42.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.42.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.42.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.43.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.43.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.43.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.43.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.43.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.43.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.44.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.44.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.44.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.44.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.44.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.44.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.45.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.45.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.45.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.45.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.45.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.45.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.46.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.46.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.46.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.46.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.46.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.46.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.47.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.47.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.47.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.47.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.47.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.47.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.48.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.48.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.48.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.48.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.48.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.48.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.49.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.49.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.49.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.49.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.49.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.49.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.5.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.5.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.5.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.5.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.5.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.5.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.50.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.50.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.50.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.50.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.50.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.50.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.51.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.51.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.51.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.51.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.51.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.51.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.52.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.52.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.52.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.52.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.52.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.52.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.53.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.53.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.53.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.53.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.53.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.53.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.54.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.54.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.54.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.54.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.54.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.54.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.55.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.55.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.55.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.55.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.55.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.55.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.56.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.56.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.56.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.56.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.56.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.56.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.57.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.57.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.57.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.57.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.57.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.57.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.58.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.58.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.58.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.58.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.58.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.58.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.59.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.59.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.59.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.59.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.59.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.59.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.6.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.6.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.6.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.6.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.6.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.6.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.60.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.60.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.60.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.60.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.60.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.60.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.61.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.61.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.61.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.61.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.61.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.61.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.62.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.62.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.62.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.62.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.62.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.62.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.63.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.63.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.63.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.63.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.63.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.63.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.64.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.64.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.64.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.64.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.64.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.64.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.65.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.65.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.65.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.65.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.65.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.65.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.66.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.66.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.66.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.66.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.66.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.66.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.67.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.67.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.67.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.67.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.67.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.67.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.68.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.68.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.68.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.68.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.68.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.68.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.69.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.69.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.69.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.69.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.69.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.69.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.7.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.7.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.7.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.7.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.7.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.7.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.70.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.70.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.70.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.70.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.70.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.70.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.71.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.71.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.71.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.71.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.71.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.71.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.72.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.72.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.72.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.72.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.72.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.72.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.73.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.73.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.73.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.73.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.73.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.73.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.74.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.74.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.74.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.74.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.74.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.74.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.75.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.75.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.75.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.75.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.75.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.75.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.76.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.76.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.76.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.76.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.76.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.76.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.77.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.77.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.77.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.77.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.77.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.77.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.78.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.78.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.78.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.78.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.78.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.78.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.79.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.79.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.79.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.79.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.79.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.79.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.8.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.8.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.8.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.8.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.8.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.8.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.80.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.80.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.80.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.80.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.80.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.80.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.81.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.81.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.81.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.81.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.81.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.81.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.82.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.82.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.82.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.82.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.82.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.82.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.83.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.83.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.83.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.83.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.83.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.83.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.84.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.84.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.84.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.84.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.84.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.84.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.85.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.85.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.85.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.85.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.85.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.85.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.86.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.86.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.86.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.86.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.86.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.86.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.87.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.87.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.87.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.87.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.87.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.87.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.88.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.88.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.88.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.88.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.88.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.88.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.89.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.89.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.89.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.89.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.89.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.89.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.9.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.9.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.9.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.9.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.9.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.9.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.90.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.90.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.90.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.90.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.90.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.90.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.91.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.91.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.91.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.91.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.91.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.91.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.92.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.92.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.92.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.92.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.92.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.92.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.93.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.93.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.93.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.93.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.93.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.93.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.94.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.94.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.94.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.94.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.94.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.94.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.95.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.95.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.95.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.95.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.95.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.95.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.96.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.96.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.96.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.96.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.96.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.96.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.97.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.97.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.97.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.97.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.97.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.97.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.98.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.98.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.98.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.98.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.98.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.98.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.99.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.99.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.99.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.99.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.99.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.experts.99.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.gate.e_score_correction_bias": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.gate.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.shared_experts.down_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.shared_experts.down_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.shared_experts.gate_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.shared_experts.gate_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.shared_experts.up_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.mlp.shared_experts.up_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.post_attention_layernorm.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.self_attn.k_norm.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.self_attn.k_proj.bias": "model-00064-of-00092.safetensors",
+ "model.layers.63.self_attn.k_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.self_attn.k_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.self_attn.o_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.self_attn.o_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.self_attn.q_norm.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.self_attn.q_proj.bias": "model-00064-of-00092.safetensors",
+ "model.layers.63.self_attn.q_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.self_attn.q_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.63.self_attn.v_proj.bias": "model-00064-of-00092.safetensors",
+ "model.layers.63.self_attn.v_proj.weight": "model-00064-of-00092.safetensors",
+ "model.layers.63.self_attn.v_proj.weight_scale": "model-00064-of-00092.safetensors",
+ "model.layers.64.input_layernorm.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.0.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.0.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.0.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.0.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.0.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.0.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.1.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.1.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.1.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.1.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.1.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.1.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.10.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.10.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.10.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.10.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.10.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.10.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.100.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.100.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.100.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.100.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.100.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.100.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.101.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.101.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.101.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.101.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.101.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.101.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.102.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.102.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.102.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.102.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.102.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.102.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.103.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.103.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.103.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.103.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.103.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.103.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.104.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.104.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.104.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.104.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.104.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.104.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.105.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.105.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.105.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.105.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.105.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.105.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.106.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.106.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.106.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.106.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.106.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.106.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.107.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.107.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.107.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.107.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.107.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.107.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.108.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.108.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.108.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.108.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.108.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.108.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.109.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.109.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.109.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.109.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.109.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.109.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.11.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.11.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.11.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.11.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.11.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.11.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.110.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.110.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.110.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.110.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.110.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.110.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.111.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.111.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.111.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.111.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.111.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.111.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.112.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.112.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.112.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.112.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.112.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.112.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.113.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.113.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.113.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.113.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.113.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.113.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.114.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.114.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.114.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.114.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.114.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.114.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.115.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.115.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.115.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.115.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.115.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.115.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.116.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.116.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.116.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.116.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.116.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.116.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.117.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.117.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.117.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.117.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.117.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.117.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.118.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.118.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.118.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.118.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.118.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.118.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.119.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.119.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.119.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.119.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.119.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.119.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.12.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.12.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.12.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.12.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.12.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.12.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.120.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.120.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.120.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.120.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.120.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.120.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.121.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.121.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.121.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.121.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.121.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.121.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.122.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.122.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.122.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.122.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.122.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.122.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.123.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.123.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.123.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.123.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.123.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.123.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.124.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.124.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.124.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.124.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.124.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.124.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.125.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.125.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.125.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.125.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.125.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.125.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.126.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.126.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.126.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.126.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.126.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.126.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.127.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.127.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.127.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.127.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.127.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.127.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.128.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.128.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.128.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.128.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.128.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.128.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.129.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.129.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.129.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.129.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.129.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.129.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.13.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.13.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.13.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.13.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.13.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.13.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.130.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.130.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.130.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.130.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.130.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.130.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.131.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.131.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.131.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.131.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.131.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.131.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.132.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.132.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.132.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.132.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.132.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.132.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.133.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.133.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.133.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.133.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.133.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.133.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.134.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.134.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.134.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.134.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.134.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.134.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.135.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.135.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.135.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.135.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.135.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.135.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.136.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.136.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.136.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.136.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.136.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.136.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.137.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.137.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.137.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.137.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.137.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.137.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.138.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.138.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.138.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.138.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.138.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.138.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.139.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.139.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.139.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.139.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.139.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.139.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.14.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.14.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.14.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.14.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.14.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.14.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.140.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.140.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.140.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.140.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.140.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.140.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.141.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.141.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.141.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.141.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.141.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.141.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.142.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.142.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.142.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.142.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.142.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.142.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.143.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.143.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.143.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.143.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.143.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.143.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.144.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.144.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.144.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.144.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.144.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.144.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.145.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.145.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.145.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.145.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.145.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.145.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.146.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.146.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.146.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.146.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.146.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.146.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.147.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.147.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.147.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.147.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.147.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.147.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.148.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.148.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.148.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.148.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.148.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.148.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.149.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.149.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.149.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.149.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.149.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.149.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.15.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.15.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.15.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.15.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.15.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.15.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.150.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.150.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.150.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.150.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.150.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.150.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.151.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.151.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.151.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.151.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.151.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.151.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.152.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.152.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.152.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.152.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.152.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.152.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.153.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.153.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.153.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.153.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.153.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.153.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.154.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.154.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.154.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.154.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.154.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.154.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.155.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.155.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.155.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.155.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.155.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.155.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.156.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.156.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.156.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.156.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.156.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.156.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.157.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.157.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.157.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.157.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.157.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.157.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.158.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.158.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.158.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.158.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.158.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.158.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.159.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.159.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.159.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.159.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.159.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.159.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.16.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.16.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.16.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.16.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.16.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.16.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.17.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.17.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.17.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.17.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.17.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.17.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.18.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.18.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.18.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.18.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.18.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.18.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.19.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.19.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.19.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.19.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.19.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.19.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.2.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.2.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.2.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.2.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.2.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.2.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.20.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.20.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.20.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.20.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.20.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.20.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.21.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.21.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.21.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.21.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.21.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.21.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.22.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.22.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.22.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.22.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.22.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.22.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.23.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.23.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.23.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.23.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.23.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.23.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.24.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.24.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.24.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.24.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.24.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.24.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.25.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.25.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.25.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.25.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.25.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.25.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.26.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.26.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.26.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.26.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.26.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.26.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.27.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.27.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.27.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.27.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.27.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.27.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.28.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.28.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.28.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.28.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.28.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.28.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.29.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.29.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.29.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.29.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.29.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.29.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.3.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.3.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.3.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.3.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.3.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.3.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.30.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.30.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.30.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.30.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.30.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.30.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.31.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.31.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.31.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.31.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.31.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.31.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.32.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.32.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.32.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.32.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.32.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.32.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.33.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.33.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.33.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.33.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.33.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.33.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.34.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.34.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.34.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.34.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.34.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.34.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.35.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.35.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.35.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.35.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.35.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.35.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.36.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.36.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.36.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.36.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.36.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.36.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.37.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.37.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.37.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.37.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.37.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.37.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.38.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.38.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.38.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.38.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.38.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.38.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.39.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.39.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.39.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.39.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.39.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.39.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.4.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.4.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.4.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.4.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.4.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.4.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.40.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.40.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.40.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.40.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.40.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.40.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.41.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.41.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.41.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.41.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.41.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.41.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.42.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.42.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.42.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.42.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.42.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.42.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.43.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.43.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.43.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.43.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.43.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.43.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.44.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.44.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.44.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.44.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.44.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.44.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.45.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.45.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.45.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.45.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.45.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.45.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.46.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.46.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.46.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.46.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.46.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.46.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.47.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.47.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.47.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.47.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.47.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.47.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.48.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.48.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.48.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.48.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.48.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.48.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.49.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.49.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.49.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.49.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.49.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.49.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.5.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.5.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.5.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.5.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.5.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.5.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.50.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.50.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.50.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.50.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.50.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.50.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.51.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.51.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.51.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.51.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.51.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.51.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.52.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.52.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.52.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.52.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.52.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.52.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.53.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.53.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.53.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.53.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.53.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.53.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.54.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.54.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.54.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.54.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.54.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.54.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.55.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.55.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.55.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.55.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.55.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.55.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.56.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.56.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.56.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.56.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.56.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.56.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.57.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.57.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.57.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.57.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.57.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.57.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.58.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.58.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.58.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.58.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.58.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.58.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.59.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.59.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.59.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.59.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.59.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.59.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.6.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.6.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.6.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.6.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.6.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.6.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.60.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.60.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.60.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.60.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.60.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.60.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.61.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.61.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.61.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.61.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.61.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.61.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.62.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.62.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.62.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.62.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.62.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.62.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.63.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.63.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.63.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.63.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.63.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.63.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.64.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.64.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.64.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.64.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.64.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.64.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.65.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.65.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.65.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.65.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.65.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.65.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.66.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.66.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.66.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.66.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.66.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.66.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.67.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.67.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.67.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.67.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.67.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.67.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.68.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.68.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.68.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.68.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.68.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.68.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.69.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.69.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.69.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.69.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.69.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.69.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.7.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.7.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.7.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.7.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.7.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.7.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.70.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.70.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.70.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.70.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.70.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.70.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.71.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.71.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.71.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.71.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.71.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.71.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.72.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.72.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.72.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.72.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.72.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.72.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.73.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.73.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.73.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.73.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.73.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.73.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.74.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.74.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.74.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.74.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.74.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.74.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.75.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.75.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.75.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.75.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.75.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.75.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.76.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.76.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.76.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.76.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.76.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.76.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.77.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.77.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.77.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.77.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.77.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.77.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.78.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.78.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.78.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.78.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.78.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.78.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.79.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.79.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.79.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.79.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.79.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.79.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.8.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.8.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.8.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.8.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.8.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.8.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.80.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.80.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.80.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.80.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.80.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.80.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.81.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.81.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.81.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.81.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.81.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.81.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.82.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.82.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.82.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.82.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.82.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.82.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.83.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.83.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.83.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.83.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.83.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.83.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.84.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.84.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.84.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.84.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.84.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.84.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.85.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.85.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.85.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.85.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.85.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.85.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.86.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.86.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.86.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.86.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.86.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.86.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.87.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.87.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.87.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.87.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.87.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.87.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.88.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.88.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.88.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.88.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.88.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.88.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.89.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.89.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.89.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.89.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.89.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.89.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.9.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.9.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.9.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.9.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.9.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.9.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.90.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.90.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.90.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.90.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.90.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.90.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.91.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.91.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.91.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.91.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.91.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.91.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.92.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.92.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.92.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.92.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.92.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.92.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.93.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.93.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.93.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.93.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.93.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.93.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.94.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.94.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.94.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.94.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.94.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.94.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.95.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.95.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.95.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.95.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.95.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.95.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.96.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.96.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.96.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.96.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.96.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.96.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.97.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.97.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.97.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.97.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.97.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.97.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.98.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.98.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.98.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.98.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.98.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.98.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.99.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.99.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.99.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.99.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.99.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.experts.99.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.gate.e_score_correction_bias": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.gate.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.shared_experts.down_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.shared_experts.down_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.shared_experts.gate_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.shared_experts.gate_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.shared_experts.up_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.mlp.shared_experts.up_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.post_attention_layernorm.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.self_attn.k_norm.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.self_attn.k_proj.bias": "model-00065-of-00092.safetensors",
+ "model.layers.64.self_attn.k_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.self_attn.k_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.self_attn.o_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.self_attn.o_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.self_attn.q_norm.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.self_attn.q_proj.bias": "model-00065-of-00092.safetensors",
+ "model.layers.64.self_attn.q_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.self_attn.q_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.64.self_attn.v_proj.bias": "model-00065-of-00092.safetensors",
+ "model.layers.64.self_attn.v_proj.weight": "model-00065-of-00092.safetensors",
+ "model.layers.64.self_attn.v_proj.weight_scale": "model-00065-of-00092.safetensors",
+ "model.layers.65.input_layernorm.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.0.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.0.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.0.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.0.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.0.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.0.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.1.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.1.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.1.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.1.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.1.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.1.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.10.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.10.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.10.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.10.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.10.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.10.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.100.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.100.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.100.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.100.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.100.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.100.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.101.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.101.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.101.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.101.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.101.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.101.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.102.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.102.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.102.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.102.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.102.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.102.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.103.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.103.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.103.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.103.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.103.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.103.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.104.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.104.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.104.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.104.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.104.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.104.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.105.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.105.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.105.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.105.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.105.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.105.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.106.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.106.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.106.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.106.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.106.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.106.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.107.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.107.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.107.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.107.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.107.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.107.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.108.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.108.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.108.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.108.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.108.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.108.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.109.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.109.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.109.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.109.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.109.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.109.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.11.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.11.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.11.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.11.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.11.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.11.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.110.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.110.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.110.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.110.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.110.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.110.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.111.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.111.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.111.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.111.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.111.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.111.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.112.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.112.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.112.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.112.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.112.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.112.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.113.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.113.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.113.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.113.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.113.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.113.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.114.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.114.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.114.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.114.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.114.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.114.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.115.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.115.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.115.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.115.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.115.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.115.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.116.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.116.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.116.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.116.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.116.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.116.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.117.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.117.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.117.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.117.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.117.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.117.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.118.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.118.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.118.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.118.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.118.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.118.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.119.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.119.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.119.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.119.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.119.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.119.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.12.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.12.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.12.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.12.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.12.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.12.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.120.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.120.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.120.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.120.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.120.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.120.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.121.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.121.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.121.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.121.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.121.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.121.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.122.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.122.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.122.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.122.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.122.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.122.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.123.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.123.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.123.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.123.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.123.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.123.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.124.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.124.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.124.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.124.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.124.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.124.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.125.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.125.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.125.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.125.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.125.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.125.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.126.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.126.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.126.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.126.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.126.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.126.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.127.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.127.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.127.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.127.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.127.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.127.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.128.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.128.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.128.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.128.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.128.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.128.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.129.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.129.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.129.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.129.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.129.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.129.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.13.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.13.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.13.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.13.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.13.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.13.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.130.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.130.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.130.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.130.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.130.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.130.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.131.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.131.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.131.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.131.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.131.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.131.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.132.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.132.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.132.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.132.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.132.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.132.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.133.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.133.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.133.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.133.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.133.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.133.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.134.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.134.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.134.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.134.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.134.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.134.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.135.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.135.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.135.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.135.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.135.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.135.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.136.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.136.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.136.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.136.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.136.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.136.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.137.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.137.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.137.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.137.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.137.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.137.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.138.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.138.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.138.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.138.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.138.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.138.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.139.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.139.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.139.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.139.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.139.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.139.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.14.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.14.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.14.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.14.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.14.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.14.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.140.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.140.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.140.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.140.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.140.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.140.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.141.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.141.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.141.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.141.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.141.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.141.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.142.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.142.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.142.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.142.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.142.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.142.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.143.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.143.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.143.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.143.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.143.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.143.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.144.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.144.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.144.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.144.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.144.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.144.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.145.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.145.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.145.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.145.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.145.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.145.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.146.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.146.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.146.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.146.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.146.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.146.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.147.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.147.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.147.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.147.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.147.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.147.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.148.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.148.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.148.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.148.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.148.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.148.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.149.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.149.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.149.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.149.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.149.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.149.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.15.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.15.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.15.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.15.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.15.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.15.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.150.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.150.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.150.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.150.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.150.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.150.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.151.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.151.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.151.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.151.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.151.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.151.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.152.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.152.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.152.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.152.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.152.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.152.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.153.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.153.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.153.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.153.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.153.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.153.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.154.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.154.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.154.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.154.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.154.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.154.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.155.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.155.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.155.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.155.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.155.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.155.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.156.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.156.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.156.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.156.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.156.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.156.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.157.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.157.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.157.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.157.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.157.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.157.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.158.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.158.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.158.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.158.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.158.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.158.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.159.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.159.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.159.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.159.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.159.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.159.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.16.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.16.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.16.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.16.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.16.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.16.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.17.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.17.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.17.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.17.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.17.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.17.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.18.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.18.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.18.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.18.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.18.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.18.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.19.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.19.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.19.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.19.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.19.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.19.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.2.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.2.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.2.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.2.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.2.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.2.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.20.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.20.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.20.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.20.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.20.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.20.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.21.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.21.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.21.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.21.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.21.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.21.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.22.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.22.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.22.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.22.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.22.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.22.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.23.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.23.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.23.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.23.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.23.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.23.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.24.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.24.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.24.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.24.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.24.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.24.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.25.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.25.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.25.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.25.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.25.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.25.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.26.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.26.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.26.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.26.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.26.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.26.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.27.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.27.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.27.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.27.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.27.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.27.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.28.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.28.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.28.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.28.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.28.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.28.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.29.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.29.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.29.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.29.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.29.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.29.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.3.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.3.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.3.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.3.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.3.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.3.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.30.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.30.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.30.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.30.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.30.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.30.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.31.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.31.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.31.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.31.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.31.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.31.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.32.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.32.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.32.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.32.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.32.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.32.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.33.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.33.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.33.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.33.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.33.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.33.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.34.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.34.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.34.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.34.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.34.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.34.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.35.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.35.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.35.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.35.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.35.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.35.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.36.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.36.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.36.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.36.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.36.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.36.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.37.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.37.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.37.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.37.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.37.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.37.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.38.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.38.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.38.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.38.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.38.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.38.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.39.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.39.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.39.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.39.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.39.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.39.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.4.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.4.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.4.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.4.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.4.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.4.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.40.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.40.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.40.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.40.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.40.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.40.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.41.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.41.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.41.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.41.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.41.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.41.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.42.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.42.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.42.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.42.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.42.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.42.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.43.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.43.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.43.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.43.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.43.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.43.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.44.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.44.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.44.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.44.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.44.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.44.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.45.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.45.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.45.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.45.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.45.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.45.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.46.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.46.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.46.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.46.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.46.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.46.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.47.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.47.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.47.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.47.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.47.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.47.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.48.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.48.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.48.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.48.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.48.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.48.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.49.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.49.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.49.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.49.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.49.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.49.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.5.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.5.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.5.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.5.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.5.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.5.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.50.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.50.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.50.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.50.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.50.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.50.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.51.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.51.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.51.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.51.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.51.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.51.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.52.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.52.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.52.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.52.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.52.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.52.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.53.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.53.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.53.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.53.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.53.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.53.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.54.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.54.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.54.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.54.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.54.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.54.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.55.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.55.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.55.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.55.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.55.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.55.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.56.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.56.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.56.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.56.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.56.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.56.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.57.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.57.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.57.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.57.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.57.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.57.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.58.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.58.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.58.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.58.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.58.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.58.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.59.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.59.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.59.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.59.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.59.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.59.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.6.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.6.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.6.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.6.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.6.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.6.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.60.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.60.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.60.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.60.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.60.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.60.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.61.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.61.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.61.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.61.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.61.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.61.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.62.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.62.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.62.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.62.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.62.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.62.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.63.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.63.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.63.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.63.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.63.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.63.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.64.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.64.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.64.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.64.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.64.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.64.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.65.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.65.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.65.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.65.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.65.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.65.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.66.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.66.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.66.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.66.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.66.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.66.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.67.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.67.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.67.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.67.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.67.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.67.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.68.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.68.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.68.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.68.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.68.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.68.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.69.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.69.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.69.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.69.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.69.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.69.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.7.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.7.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.7.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.7.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.7.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.7.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.70.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.70.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.70.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.70.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.70.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.70.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.71.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.71.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.71.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.71.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.71.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.71.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.72.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.72.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.72.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.72.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.72.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.72.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.73.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.73.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.73.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.73.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.73.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.73.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.74.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.74.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.74.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.74.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.74.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.74.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.75.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.75.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.75.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.75.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.75.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.75.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.76.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.76.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.76.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.76.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.76.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.76.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.77.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.77.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.77.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.77.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.77.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.77.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.78.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.78.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.78.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.78.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.78.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.78.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.79.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.79.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.79.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.79.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.79.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.79.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.8.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.8.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.8.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.8.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.8.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.8.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.80.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.80.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.80.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.80.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.80.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.80.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.81.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.81.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.81.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.81.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.81.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.81.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.82.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.82.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.82.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.82.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.82.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.82.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.83.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.83.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.83.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.83.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.83.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.83.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.84.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.84.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.84.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.84.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.84.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.84.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.85.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.85.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.85.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.85.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.85.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.85.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.86.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.86.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.86.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.86.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.86.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.86.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.87.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.87.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.87.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.87.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.87.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.87.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.88.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.88.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.88.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.88.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.88.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.88.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.89.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.89.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.89.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.89.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.89.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.89.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.9.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.9.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.9.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.9.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.9.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.9.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.90.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.90.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.90.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.90.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.90.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.90.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.91.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.91.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.91.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.91.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.91.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.91.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.92.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.92.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.92.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.92.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.92.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.92.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.93.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.93.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.93.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.93.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.93.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.93.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.94.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.94.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.94.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.94.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.94.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.94.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.95.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.95.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.95.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.95.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.95.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.95.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.96.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.96.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.96.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.96.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.96.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.96.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.97.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.97.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.97.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.97.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.97.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.97.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.98.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.98.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.98.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.98.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.98.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.98.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.99.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.99.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.99.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.99.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.99.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.experts.99.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.gate.e_score_correction_bias": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.gate.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.shared_experts.down_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.shared_experts.down_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.shared_experts.gate_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.shared_experts.gate_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.shared_experts.up_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.mlp.shared_experts.up_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.post_attention_layernorm.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.self_attn.k_norm.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.self_attn.k_proj.bias": "model-00066-of-00092.safetensors",
+ "model.layers.65.self_attn.k_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.self_attn.k_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.self_attn.o_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.self_attn.o_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.self_attn.q_norm.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.self_attn.q_proj.bias": "model-00066-of-00092.safetensors",
+ "model.layers.65.self_attn.q_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.self_attn.q_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.65.self_attn.v_proj.bias": "model-00066-of-00092.safetensors",
+ "model.layers.65.self_attn.v_proj.weight": "model-00066-of-00092.safetensors",
+ "model.layers.65.self_attn.v_proj.weight_scale": "model-00066-of-00092.safetensors",
+ "model.layers.66.input_layernorm.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.0.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.0.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.0.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.0.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.0.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.0.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.1.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.1.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.1.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.1.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.1.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.1.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.10.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.10.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.10.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.10.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.10.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.10.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.100.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.100.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.100.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.100.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.100.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.100.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.101.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.101.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.101.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.101.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.101.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.101.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.102.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.102.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.102.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.102.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.102.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.102.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.103.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.103.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.103.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.103.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.103.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.103.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.104.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.104.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.104.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.104.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.104.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.104.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.105.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.105.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.105.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.105.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.105.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.105.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.106.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.106.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.106.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.106.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.106.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.106.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.107.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.107.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.107.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.107.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.107.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.107.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.108.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.108.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.108.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.108.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.108.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.108.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.109.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.109.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.109.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.109.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.109.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.109.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.11.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.11.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.11.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.11.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.11.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.11.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.110.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.110.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.110.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.110.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.110.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.110.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.111.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.111.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.111.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.111.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.111.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.111.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.112.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.112.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.112.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.112.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.112.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.112.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.113.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.113.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.113.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.113.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.113.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.113.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.114.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.114.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.114.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.114.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.114.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.114.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.115.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.115.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.115.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.115.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.115.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.115.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.116.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.116.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.116.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.116.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.116.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.116.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.117.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.117.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.117.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.117.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.117.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.117.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.118.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.118.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.118.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.118.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.118.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.118.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.119.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.119.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.119.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.119.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.119.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.119.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.12.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.12.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.12.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.12.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.12.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.12.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.120.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.120.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.120.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.120.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.120.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.120.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.121.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.121.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.121.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.121.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.121.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.121.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.122.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.122.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.122.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.122.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.122.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.122.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.123.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.123.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.123.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.123.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.123.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.123.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.124.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.124.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.124.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.124.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.124.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.124.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.125.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.125.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.125.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.125.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.125.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.125.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.126.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.126.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.126.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.126.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.126.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.126.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.127.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.127.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.127.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.127.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.127.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.127.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.128.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.128.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.128.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.128.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.128.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.128.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.129.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.129.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.129.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.129.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.129.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.129.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.13.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.13.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.13.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.13.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.13.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.13.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.130.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.130.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.130.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.130.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.130.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.130.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.131.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.131.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.131.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.131.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.131.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.131.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.132.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.132.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.132.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.132.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.132.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.132.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.133.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.133.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.133.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.133.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.133.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.133.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.134.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.134.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.134.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.134.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.134.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.134.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.135.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.135.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.135.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.135.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.135.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.135.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.136.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.136.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.136.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.136.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.136.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.136.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.137.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.137.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.137.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.137.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.137.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.137.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.138.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.138.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.138.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.138.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.138.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.138.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.139.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.139.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.139.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.139.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.139.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.139.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.14.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.14.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.14.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.14.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.14.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.14.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.140.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.140.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.140.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.140.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.140.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.140.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.141.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.141.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.141.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.141.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.141.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.141.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.142.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.142.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.142.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.142.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.142.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.142.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.143.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.143.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.143.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.143.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.143.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.143.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.144.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.144.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.144.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.144.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.144.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.144.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.145.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.145.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.145.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.145.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.145.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.145.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.146.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.146.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.146.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.146.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.146.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.146.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.147.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.147.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.147.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.147.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.147.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.147.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.148.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.148.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.148.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.148.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.148.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.148.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.149.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.149.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.149.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.149.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.149.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.149.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.15.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.15.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.15.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.15.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.15.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.15.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.150.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.150.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.150.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.150.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.150.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.150.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.151.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.151.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.151.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.151.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.151.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.151.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.152.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.152.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.152.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.152.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.152.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.152.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.153.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.153.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.153.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.153.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.153.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.153.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.154.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.154.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.154.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.154.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.154.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.154.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.155.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.155.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.155.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.155.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.155.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.155.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.156.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.156.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.156.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.156.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.156.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.156.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.157.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.157.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.157.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.157.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.157.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.157.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.158.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.158.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.158.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.158.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.158.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.158.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.159.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.159.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.159.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.159.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.159.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.159.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.16.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.16.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.16.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.16.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.16.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.16.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.17.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.17.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.17.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.17.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.17.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.17.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.18.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.18.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.18.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.18.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.18.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.18.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.19.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.19.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.19.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.19.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.19.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.19.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.2.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.2.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.2.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.2.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.2.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.2.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.20.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.20.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.20.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.20.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.20.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.20.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.21.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.21.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.21.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.21.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.21.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.21.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.22.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.22.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.22.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.22.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.22.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.22.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.23.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.23.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.23.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.23.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.23.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.23.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.24.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.24.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.24.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.24.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.24.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.24.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.25.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.25.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.25.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.25.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.25.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.25.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.26.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.26.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.26.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.26.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.26.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.26.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.27.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.27.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.27.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.27.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.27.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.27.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.28.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.28.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.28.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.28.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.28.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.28.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.29.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.29.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.29.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.29.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.29.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.29.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.3.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.3.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.3.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.3.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.3.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.3.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.30.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.30.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.30.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.30.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.30.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.30.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.31.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.31.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.31.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.31.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.31.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.31.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.32.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.32.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.32.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.32.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.32.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.32.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.33.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.33.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.33.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.33.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.33.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.33.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.34.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.34.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.34.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.34.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.34.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.34.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.35.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.35.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.35.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.35.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.35.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.35.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.36.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.36.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.36.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.36.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.36.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.36.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.37.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.37.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.37.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.37.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.37.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.37.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.38.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.38.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.38.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.38.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.38.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.38.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.39.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.39.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.39.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.39.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.39.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.39.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.4.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.4.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.4.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.4.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.4.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.4.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.40.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.40.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.40.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.40.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.40.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.40.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.41.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.41.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.41.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.41.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.41.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.41.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.42.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.42.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.42.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.42.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.42.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.42.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.43.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.43.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.43.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.43.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.43.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.43.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.44.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.44.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.44.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.44.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.44.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.44.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.45.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.45.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.45.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.45.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.45.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.45.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.46.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.46.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.46.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.46.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.46.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.46.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.47.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.47.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.47.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.47.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.47.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.47.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.48.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.48.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.48.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.48.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.48.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.48.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.49.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.49.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.49.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.49.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.49.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.49.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.5.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.5.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.5.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.5.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.5.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.5.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.50.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.50.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.50.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.50.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.50.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.50.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.51.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.51.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.51.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.51.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.51.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.51.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.52.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.52.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.52.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.52.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.52.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.52.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.53.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.53.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.53.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.53.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.53.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.53.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.54.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.54.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.54.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.54.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.54.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.54.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.55.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.55.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.55.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.55.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.55.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.55.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.56.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.56.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.56.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.56.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.56.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.56.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.57.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.57.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.57.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.57.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.57.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.57.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.58.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.58.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.58.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.58.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.58.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.58.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.59.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.59.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.59.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.59.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.59.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.59.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.6.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.6.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.6.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.6.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.6.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.6.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.60.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.60.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.60.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.60.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.60.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.60.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.61.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.61.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.61.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.61.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.61.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.61.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.62.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.62.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.62.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.62.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.62.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.62.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.63.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.63.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.63.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.63.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.63.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.63.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.64.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.64.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.64.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.64.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.64.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.64.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.65.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.65.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.65.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.65.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.65.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.65.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.66.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.66.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.66.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.66.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.66.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.66.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.67.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.67.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.67.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.67.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.67.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.67.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.68.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.68.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.68.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.68.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.68.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.68.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.69.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.69.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.69.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.69.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.69.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.69.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.7.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.7.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.7.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.7.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.7.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.7.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.70.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.70.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.70.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.70.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.70.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.70.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.71.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.71.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.71.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.71.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.71.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.71.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.72.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.72.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.72.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.72.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.72.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.72.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.73.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.73.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.73.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.73.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.73.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.73.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.74.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.74.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.74.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.74.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.74.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.74.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.75.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.75.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.75.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.75.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.75.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.75.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.76.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.76.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.76.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.76.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.76.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.76.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.77.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.77.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.77.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.77.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.77.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.77.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.78.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.78.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.78.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.78.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.78.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.78.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.79.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.79.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.79.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.79.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.79.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.79.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.8.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.8.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.8.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.8.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.8.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.8.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.80.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.80.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.80.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.80.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.80.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.80.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.81.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.81.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.81.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.81.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.81.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.81.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.82.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.82.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.82.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.82.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.82.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.82.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.83.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.83.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.83.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.83.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.83.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.83.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.84.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.84.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.84.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.84.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.84.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.84.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.85.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.85.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.85.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.85.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.85.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.85.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.86.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.86.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.86.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.86.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.86.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.86.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.87.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.87.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.87.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.87.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.87.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.87.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.88.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.88.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.88.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.88.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.88.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.88.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.89.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.89.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.89.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.89.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.89.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.89.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.9.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.9.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.9.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.9.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.9.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.9.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.90.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.90.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.90.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.90.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.90.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.90.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.91.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.91.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.91.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.91.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.91.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.91.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.92.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.92.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.92.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.92.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.92.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.92.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.93.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.93.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.93.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.93.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.93.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.93.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.94.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.94.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.94.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.94.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.94.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.94.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.95.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.95.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.95.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.95.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.95.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.95.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.96.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.96.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.96.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.96.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.96.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.96.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.97.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.97.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.97.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.97.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.97.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.97.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.98.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.98.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.98.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.98.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.98.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.98.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.99.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.99.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.99.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.99.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.99.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.experts.99.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.gate.e_score_correction_bias": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.gate.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.shared_experts.down_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.shared_experts.down_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.shared_experts.gate_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.shared_experts.gate_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.shared_experts.up_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.mlp.shared_experts.up_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.post_attention_layernorm.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.self_attn.k_norm.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.self_attn.k_proj.bias": "model-00067-of-00092.safetensors",
+ "model.layers.66.self_attn.k_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.self_attn.k_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.self_attn.o_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.self_attn.o_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.self_attn.q_norm.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.self_attn.q_proj.bias": "model-00067-of-00092.safetensors",
+ "model.layers.66.self_attn.q_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.self_attn.q_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.66.self_attn.v_proj.bias": "model-00067-of-00092.safetensors",
+ "model.layers.66.self_attn.v_proj.weight": "model-00067-of-00092.safetensors",
+ "model.layers.66.self_attn.v_proj.weight_scale": "model-00067-of-00092.safetensors",
+ "model.layers.67.input_layernorm.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.0.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.0.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.0.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.0.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.0.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.0.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.1.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.1.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.1.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.1.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.1.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.1.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.10.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.10.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.10.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.10.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.10.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.10.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.100.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.100.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.100.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.100.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.100.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.100.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.101.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.101.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.101.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.101.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.101.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.101.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.102.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.102.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.102.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.102.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.102.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.102.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.103.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.103.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.103.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.103.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.103.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.103.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.104.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.104.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.104.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.104.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.104.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.104.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.105.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.105.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.105.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.105.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.105.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.105.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.106.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.106.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.106.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.106.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.106.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.106.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.107.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.107.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.107.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.107.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.107.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.107.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.108.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.108.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.108.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.108.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.108.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.108.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.109.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.109.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.109.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.109.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.109.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.109.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.11.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.11.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.11.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.11.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.11.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.11.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.110.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.110.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.110.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.110.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.110.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.110.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.111.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.111.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.111.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.111.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.111.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.111.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.112.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.112.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.112.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.112.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.112.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.112.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.113.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.113.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.113.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.113.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.113.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.113.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.114.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.114.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.114.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.114.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.114.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.114.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.115.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.115.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.115.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.115.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.115.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.115.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.116.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.116.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.116.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.116.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.116.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.116.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.117.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.117.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.117.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.117.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.117.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.117.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.118.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.118.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.118.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.118.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.118.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.118.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.119.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.119.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.119.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.119.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.119.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.119.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.12.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.12.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.12.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.12.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.12.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.12.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.120.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.120.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.120.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.120.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.120.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.120.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.121.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.121.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.121.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.121.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.121.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.121.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.122.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.122.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.122.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.122.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.122.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.122.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.123.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.123.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.123.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.123.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.123.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.123.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.124.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.124.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.124.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.124.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.124.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.124.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.125.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.125.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.125.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.125.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.125.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.125.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.126.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.126.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.126.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.126.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.126.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.126.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.127.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.127.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.127.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.127.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.127.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.127.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.128.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.128.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.128.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.128.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.128.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.128.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.129.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.129.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.129.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.129.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.129.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.129.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.13.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.13.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.13.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.13.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.13.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.13.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.130.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.130.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.130.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.130.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.130.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.130.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.131.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.131.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.131.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.131.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.131.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.131.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.132.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.132.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.132.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.132.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.132.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.132.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.133.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.133.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.133.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.133.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.133.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.133.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.134.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.134.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.134.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.134.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.134.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.134.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.135.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.135.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.135.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.135.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.135.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.135.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.136.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.136.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.136.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.136.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.136.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.136.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.137.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.137.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.137.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.137.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.137.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.137.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.138.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.138.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.138.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.138.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.138.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.138.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.139.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.139.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.139.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.139.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.139.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.139.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.14.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.14.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.14.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.14.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.14.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.14.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.140.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.140.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.140.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.140.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.140.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.140.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.141.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.141.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.141.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.141.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.141.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.141.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.142.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.142.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.142.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.142.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.142.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.142.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.143.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.143.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.143.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.143.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.143.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.143.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.144.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.144.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.144.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.144.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.144.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.144.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.145.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.145.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.145.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.145.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.145.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.145.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.146.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.146.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.146.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.146.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.146.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.146.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.147.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.147.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.147.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.147.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.147.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.147.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.148.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.148.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.148.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.148.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.148.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.148.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.149.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.149.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.149.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.149.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.149.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.149.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.15.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.15.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.15.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.15.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.15.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.15.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.150.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.150.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.150.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.150.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.150.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.150.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.151.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.151.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.151.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.151.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.151.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.151.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.152.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.152.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.152.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.152.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.152.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.152.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.153.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.153.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.153.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.153.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.153.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.153.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.154.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.154.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.154.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.154.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.154.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.154.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.155.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.155.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.155.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.155.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.155.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.155.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.156.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.156.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.156.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.156.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.156.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.156.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.157.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.157.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.157.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.157.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.157.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.157.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.158.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.158.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.158.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.158.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.158.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.158.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.159.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.159.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.159.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.159.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.159.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.159.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.16.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.16.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.16.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.16.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.16.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.16.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.17.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.17.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.17.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.17.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.17.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.17.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.18.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.18.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.18.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.18.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.18.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.18.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.19.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.19.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.19.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.19.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.19.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.19.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.2.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.2.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.2.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.2.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.2.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.2.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.20.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.20.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.20.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.20.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.20.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.20.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.21.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.21.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.21.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.21.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.21.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.21.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.22.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.22.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.22.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.22.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.22.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.22.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.23.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.23.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.23.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.23.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.23.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.23.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.24.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.24.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.24.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.24.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.24.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.24.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.25.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.25.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.25.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.25.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.25.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.25.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.26.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.26.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.26.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.26.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.26.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.26.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.27.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.27.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.27.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.27.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.27.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.27.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.28.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.28.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.28.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.28.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.28.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.28.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.29.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.29.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.29.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.29.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.29.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.29.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.3.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.3.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.3.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.3.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.3.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.3.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.30.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.30.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.30.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.30.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.30.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.30.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.31.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.31.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.31.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.31.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.31.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.31.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.32.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.32.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.32.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.32.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.32.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.32.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.33.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.33.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.33.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.33.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.33.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.33.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.34.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.34.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.34.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.34.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.34.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.34.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.35.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.35.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.35.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.35.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.35.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.35.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.36.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.36.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.36.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.36.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.36.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.36.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.37.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.37.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.37.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.37.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.37.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.37.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.38.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.38.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.38.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.38.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.38.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.38.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.39.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.39.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.39.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.39.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.39.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.39.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.4.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.4.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.4.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.4.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.4.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.4.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.40.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.40.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.40.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.40.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.40.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.40.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.41.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.41.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.41.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.41.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.41.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.41.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.42.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.42.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.42.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.42.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.42.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.42.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.43.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.43.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.43.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.43.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.43.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.43.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.44.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.44.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.44.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.44.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.44.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.44.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.45.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.45.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.45.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.45.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.45.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.45.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.46.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.46.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.46.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.46.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.46.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.46.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.47.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.47.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.47.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.47.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.47.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.47.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.48.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.48.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.48.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.48.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.48.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.48.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.49.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.49.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.49.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.49.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.49.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.49.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.5.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.5.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.5.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.5.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.5.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.5.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.50.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.50.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.50.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.50.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.50.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.50.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.51.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.51.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.51.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.51.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.51.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.51.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.52.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.52.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.52.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.52.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.52.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.52.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.53.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.53.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.53.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.53.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.53.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.53.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.54.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.54.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.54.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.54.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.54.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.54.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.55.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.55.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.55.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.55.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.55.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.55.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.56.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.56.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.56.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.56.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.56.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.56.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.57.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.57.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.57.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.57.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.57.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.57.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.58.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.58.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.58.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.58.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.58.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.58.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.59.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.59.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.59.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.59.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.59.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.59.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.6.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.6.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.6.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.6.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.6.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.6.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.60.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.60.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.60.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.60.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.60.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.60.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.61.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.61.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.61.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.61.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.61.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.61.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.62.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.62.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.62.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.62.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.62.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.62.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.63.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.63.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.63.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.63.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.63.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.63.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.64.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.64.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.64.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.64.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.64.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.64.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.65.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.65.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.65.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.65.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.65.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.65.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.66.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.66.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.66.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.66.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.66.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.66.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.67.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.67.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.67.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.67.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.67.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.67.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.68.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.68.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.68.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.68.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.68.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.68.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.69.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.69.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.69.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.69.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.69.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.69.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.7.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.7.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.7.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.7.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.7.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.7.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.70.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.70.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.70.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.70.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.70.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.70.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.71.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.71.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.71.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.71.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.71.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.71.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.72.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.72.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.72.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.72.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.72.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.72.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.73.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.73.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.73.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.73.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.73.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.73.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.74.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.74.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.74.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.74.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.74.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.74.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.75.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.75.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.75.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.75.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.75.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.75.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.76.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.76.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.76.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.76.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.76.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.76.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.77.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.77.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.77.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.77.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.77.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.77.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.78.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.78.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.78.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.78.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.78.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.78.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.79.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.79.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.79.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.79.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.79.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.79.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.8.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.8.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.8.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.8.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.8.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.8.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.80.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.80.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.80.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.80.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.80.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.80.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.81.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.81.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.81.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.81.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.81.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.81.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.82.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.82.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.82.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.82.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.82.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.82.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.83.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.83.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.83.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.83.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.83.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.83.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.84.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.84.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.84.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.84.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.84.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.84.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.85.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.85.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.85.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.85.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.85.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.85.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.86.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.86.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.86.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.86.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.86.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.86.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.87.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.87.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.87.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.87.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.87.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.87.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.88.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.88.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.88.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.88.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.88.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.88.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.89.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.89.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.89.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.89.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.89.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.89.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.9.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.9.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.9.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.9.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.9.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.9.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.90.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.90.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.90.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.90.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.90.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.90.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.91.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.91.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.91.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.91.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.91.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.91.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.92.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.92.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.92.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.92.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.92.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.92.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.93.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.93.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.93.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.93.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.93.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.93.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.94.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.94.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.94.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.94.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.94.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.94.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.95.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.95.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.95.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.95.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.95.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.95.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.96.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.96.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.96.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.96.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.96.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.96.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.97.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.97.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.97.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.97.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.97.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.97.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.98.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.98.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.98.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.98.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.98.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.98.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.99.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.99.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.99.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.99.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.99.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.experts.99.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.gate.e_score_correction_bias": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.gate.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.shared_experts.down_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.shared_experts.down_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.shared_experts.gate_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.shared_experts.gate_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.shared_experts.up_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.mlp.shared_experts.up_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.post_attention_layernorm.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.self_attn.k_norm.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.self_attn.k_proj.bias": "model-00068-of-00092.safetensors",
+ "model.layers.67.self_attn.k_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.self_attn.k_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.self_attn.o_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.self_attn.o_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.self_attn.q_norm.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.self_attn.q_proj.bias": "model-00068-of-00092.safetensors",
+ "model.layers.67.self_attn.q_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.self_attn.q_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.67.self_attn.v_proj.bias": "model-00068-of-00092.safetensors",
+ "model.layers.67.self_attn.v_proj.weight": "model-00068-of-00092.safetensors",
+ "model.layers.67.self_attn.v_proj.weight_scale": "model-00068-of-00092.safetensors",
+ "model.layers.68.input_layernorm.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.0.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.0.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.0.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.0.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.0.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.0.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.1.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.1.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.1.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.1.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.1.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.1.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.10.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.10.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.10.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.10.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.10.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.10.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.100.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.100.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.100.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.100.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.100.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.100.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.101.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.101.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.101.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.101.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.101.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.101.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.102.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.102.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.102.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.102.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.102.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.102.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.103.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.103.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.103.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.103.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.103.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.103.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.104.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.104.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.104.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.104.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.104.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.104.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.105.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.105.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.105.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.105.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.105.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.105.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.106.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.106.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.106.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.106.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.106.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.106.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.107.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.107.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.107.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.107.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.107.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.107.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.108.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.108.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.108.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.108.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.108.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.108.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.109.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.109.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.109.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.109.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.109.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.109.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.11.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.11.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.11.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.11.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.11.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.11.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.110.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.110.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.110.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.110.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.110.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.110.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.111.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.111.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.111.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.111.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.111.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.111.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.112.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.112.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.112.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.112.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.112.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.112.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.113.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.113.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.113.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.113.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.113.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.113.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.114.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.114.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.114.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.114.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.114.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.114.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.115.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.115.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.115.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.115.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.115.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.115.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.116.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.116.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.116.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.116.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.116.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.116.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.117.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.117.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.117.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.117.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.117.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.117.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.118.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.118.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.118.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.118.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.118.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.118.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.119.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.119.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.119.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.119.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.119.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.119.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.12.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.12.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.12.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.12.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.12.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.12.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.120.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.120.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.120.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.120.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.120.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.120.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.121.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.121.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.121.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.121.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.121.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.121.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.122.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.122.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.122.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.122.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.122.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.122.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.123.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.123.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.123.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.123.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.123.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.123.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.124.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.124.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.124.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.124.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.124.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.124.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.125.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.125.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.125.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.125.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.125.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.125.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.126.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.126.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.126.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.126.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.126.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.126.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.127.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.127.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.127.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.127.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.127.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.127.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.128.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.128.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.128.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.128.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.128.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.128.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.129.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.129.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.129.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.129.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.129.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.129.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.13.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.13.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.13.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.13.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.13.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.13.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.130.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.130.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.130.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.130.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.130.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.130.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.131.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.131.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.131.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.131.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.131.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.131.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.132.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.132.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.132.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.132.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.132.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.132.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.133.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.133.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.133.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.133.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.133.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.133.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.134.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.134.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.134.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.134.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.134.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.134.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.135.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.135.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.135.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.135.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.135.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.135.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.136.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.136.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.136.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.136.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.136.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.136.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.137.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.137.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.137.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.137.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.137.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.137.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.138.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.138.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.138.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.138.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.138.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.138.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.139.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.139.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.139.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.139.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.139.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.139.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.14.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.14.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.14.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.14.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.14.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.14.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.140.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.140.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.140.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.140.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.140.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.140.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.141.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.141.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.141.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.141.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.141.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.141.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.142.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.142.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.142.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.142.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.142.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.142.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.143.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.143.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.143.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.143.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.143.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.143.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.144.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.144.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.144.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.144.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.144.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.144.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.145.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.145.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.145.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.145.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.145.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.145.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.146.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.146.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.146.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.146.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.146.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.146.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.147.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.147.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.147.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.147.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.147.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.147.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.148.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.148.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.148.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.148.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.148.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.148.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.149.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.149.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.149.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.149.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.149.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.149.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.15.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.15.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.15.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.15.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.15.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.15.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.150.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.150.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.150.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.150.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.150.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.150.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.151.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.151.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.151.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.151.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.151.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.151.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.152.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.152.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.152.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.152.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.152.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.152.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.153.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.153.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.153.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.153.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.153.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.153.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.154.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.154.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.154.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.154.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.154.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.154.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.155.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.155.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.155.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.155.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.155.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.155.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.156.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.156.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.156.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.156.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.156.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.156.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.157.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.157.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.157.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.157.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.157.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.157.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.158.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.158.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.158.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.158.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.158.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.158.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.159.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.159.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.159.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.159.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.159.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.159.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.16.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.16.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.16.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.16.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.16.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.16.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.17.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.17.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.17.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.17.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.17.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.17.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.18.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.18.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.18.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.18.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.18.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.18.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.19.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.19.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.19.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.19.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.19.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.19.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.2.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.2.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.2.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.2.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.2.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.2.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.20.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.20.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.20.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.20.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.20.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.20.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.21.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.21.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.21.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.21.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.21.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.21.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.22.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.22.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.22.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.22.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.22.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.22.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.23.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.23.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.23.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.23.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.23.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.23.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.24.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.24.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.24.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.24.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.24.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.24.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.25.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.25.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.25.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.25.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.25.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.25.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.26.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.26.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.26.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.26.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.26.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.26.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.27.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.27.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.27.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.27.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.27.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.27.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.28.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.28.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.28.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.28.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.28.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.28.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.29.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.29.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.29.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.29.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.29.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.29.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.3.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.3.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.3.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.3.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.3.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.3.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.30.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.30.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.30.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.30.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.30.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.30.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.31.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.31.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.31.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.31.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.31.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.31.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.32.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.32.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.32.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.32.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.32.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.32.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.33.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.33.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.33.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.33.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.33.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.33.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.34.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.34.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.34.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.34.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.34.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.34.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.35.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.35.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.35.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.35.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.35.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.35.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.36.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.36.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.36.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.36.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.36.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.36.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.37.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.37.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.37.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.37.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.37.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.37.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.38.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.38.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.38.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.38.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.38.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.38.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.39.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.39.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.39.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.39.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.39.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.39.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.4.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.4.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.4.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.4.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.4.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.4.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.40.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.40.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.40.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.40.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.40.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.40.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.41.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.41.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.41.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.41.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.41.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.41.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.42.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.42.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.42.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.42.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.42.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.42.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.43.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.43.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.43.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.43.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.43.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.43.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.44.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.44.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.44.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.44.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.44.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.44.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.45.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.45.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.45.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.45.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.45.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.45.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.46.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.46.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.46.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.46.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.46.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.46.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.47.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.47.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.47.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.47.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.47.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.47.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.48.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.48.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.48.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.48.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.48.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.48.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.49.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.49.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.49.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.49.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.49.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.49.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.5.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.5.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.5.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.5.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.5.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.5.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.50.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.50.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.50.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.50.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.50.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.50.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.51.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.51.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.51.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.51.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.51.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.51.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.52.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.52.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.52.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.52.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.52.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.52.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.53.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.53.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.53.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.53.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.53.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.53.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.54.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.54.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.54.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.54.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.54.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.54.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.55.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.55.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.55.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.55.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.55.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.55.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.56.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.56.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.56.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.56.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.56.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.56.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.57.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.57.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.57.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.57.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.57.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.57.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.58.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.58.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.58.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.58.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.58.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.58.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.59.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.59.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.59.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.59.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.59.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.59.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.6.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.6.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.6.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.6.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.6.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.6.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.60.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.60.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.60.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.60.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.60.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.60.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.61.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.61.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.61.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.61.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.61.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.61.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.62.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.62.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.62.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.62.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.62.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.62.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.63.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.63.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.63.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.63.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.63.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.63.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.64.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.64.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.64.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.64.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.64.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.64.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.65.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.65.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.65.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.65.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.65.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.65.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.66.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.66.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.66.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.66.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.66.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.66.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.67.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.67.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.67.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.67.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.67.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.67.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.68.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.68.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.68.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.68.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.68.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.68.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.69.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.69.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.69.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.69.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.69.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.69.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.7.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.7.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.7.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.7.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.7.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.7.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.70.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.70.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.70.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.70.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.70.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.70.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.71.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.71.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.71.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.71.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.71.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.71.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.72.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.72.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.72.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.72.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.72.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.72.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.73.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.73.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.73.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.73.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.73.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.73.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.74.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.74.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.74.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.74.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.74.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.74.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.75.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.75.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.75.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.75.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.75.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.75.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.76.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.76.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.76.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.76.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.76.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.76.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.77.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.77.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.77.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.77.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.77.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.77.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.78.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.78.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.78.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.78.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.78.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.78.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.79.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.79.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.79.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.79.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.79.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.79.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.8.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.8.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.8.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.8.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.8.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.8.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.80.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.80.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.80.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.80.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.80.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.80.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.81.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.81.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.81.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.81.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.81.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.81.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.82.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.82.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.82.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.82.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.82.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.82.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.83.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.83.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.83.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.83.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.83.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.83.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.84.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.84.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.84.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.84.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.84.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.84.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.85.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.85.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.85.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.85.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.85.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.85.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.86.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.86.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.86.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.86.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.86.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.86.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.87.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.87.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.87.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.87.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.87.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.87.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.88.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.88.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.88.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.88.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.88.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.88.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.89.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.89.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.89.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.89.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.89.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.89.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.9.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.9.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.9.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.9.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.9.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.9.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.90.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.90.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.90.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.90.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.90.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.90.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.91.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.91.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.91.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.91.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.91.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.91.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.92.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.92.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.92.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.92.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.92.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.92.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.93.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.93.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.93.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.93.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.93.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.93.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.94.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.94.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.94.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.94.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.94.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.94.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.95.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.95.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.95.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.95.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.95.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.95.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.96.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.96.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.96.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.96.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.96.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.96.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.97.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.97.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.97.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.97.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.97.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.97.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.98.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.98.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.98.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.98.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.98.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.98.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.99.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.99.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.99.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.99.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.99.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.experts.99.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.gate.e_score_correction_bias": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.gate.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.shared_experts.down_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.shared_experts.down_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.shared_experts.gate_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.shared_experts.gate_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.shared_experts.up_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.mlp.shared_experts.up_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.post_attention_layernorm.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.self_attn.k_norm.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.self_attn.k_proj.bias": "model-00069-of-00092.safetensors",
+ "model.layers.68.self_attn.k_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.self_attn.k_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.self_attn.o_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.self_attn.o_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.self_attn.q_norm.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.self_attn.q_proj.bias": "model-00069-of-00092.safetensors",
+ "model.layers.68.self_attn.q_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.self_attn.q_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.68.self_attn.v_proj.bias": "model-00069-of-00092.safetensors",
+ "model.layers.68.self_attn.v_proj.weight": "model-00069-of-00092.safetensors",
+ "model.layers.68.self_attn.v_proj.weight_scale": "model-00069-of-00092.safetensors",
+ "model.layers.69.input_layernorm.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.0.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.0.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.0.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.0.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.0.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.0.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.1.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.1.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.1.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.1.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.1.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.1.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.10.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.10.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.10.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.10.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.10.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.10.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.100.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.100.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.100.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.100.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.100.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.100.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.101.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.101.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.101.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.101.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.101.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.101.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.102.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.102.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.102.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.102.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.102.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.102.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.103.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.103.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.103.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.103.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.103.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.103.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.104.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.104.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.104.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.104.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.104.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.104.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.105.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.105.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.105.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.105.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.105.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.105.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.106.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.106.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.106.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.106.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.106.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.106.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.107.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.107.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.107.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.107.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.107.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.107.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.108.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.108.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.108.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.108.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.108.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.108.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.109.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.109.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.109.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.109.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.109.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.109.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.11.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.11.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.11.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.11.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.11.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.11.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.110.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.110.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.110.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.110.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.110.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.110.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.111.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.111.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.111.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.111.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.111.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.111.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.112.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.112.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.112.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.112.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.112.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.112.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.113.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.113.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.113.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.113.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.113.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.113.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.114.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.114.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.114.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.114.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.114.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.114.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.115.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.115.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.115.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.115.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.115.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.115.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.116.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.116.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.116.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.116.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.116.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.116.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.117.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.117.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.117.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.117.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.117.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.117.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.118.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.118.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.118.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.118.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.118.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.118.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.119.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.119.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.119.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.119.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.119.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.119.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.12.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.12.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.12.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.12.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.12.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.12.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.120.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.120.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.120.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.120.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.120.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.120.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.121.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.121.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.121.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.121.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.121.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.121.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.122.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.122.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.122.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.122.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.122.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.122.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.123.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.123.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.123.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.123.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.123.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.123.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.124.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.124.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.124.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.124.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.124.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.124.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.125.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.125.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.125.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.125.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.125.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.125.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.126.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.126.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.126.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.126.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.126.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.126.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.127.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.127.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.127.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.127.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.127.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.127.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.128.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.128.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.128.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.128.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.128.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.128.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.129.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.129.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.129.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.129.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.129.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.129.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.13.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.13.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.13.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.13.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.13.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.13.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.130.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.130.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.130.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.130.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.130.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.130.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.131.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.131.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.131.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.131.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.131.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.131.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.132.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.132.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.132.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.132.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.132.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.132.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.133.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.133.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.133.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.133.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.133.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.133.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.134.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.134.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.134.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.134.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.134.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.134.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.135.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.135.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.135.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.135.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.135.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.135.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.136.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.136.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.136.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.136.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.136.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.136.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.137.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.137.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.137.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.137.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.137.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.137.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.138.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.138.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.138.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.138.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.138.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.138.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.139.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.139.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.139.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.139.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.139.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.139.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.14.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.14.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.14.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.14.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.14.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.14.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.140.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.140.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.140.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.140.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.140.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.140.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.141.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.141.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.141.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.141.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.141.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.141.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.142.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.142.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.142.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.142.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.142.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.142.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.143.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.143.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.143.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.143.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.143.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.143.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.144.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.144.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.144.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.144.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.144.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.144.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.145.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.145.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.145.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.145.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.145.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.145.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.146.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.146.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.146.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.146.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.146.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.146.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.147.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.147.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.147.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.147.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.147.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.147.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.148.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.148.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.148.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.148.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.148.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.148.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.149.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.149.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.149.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.149.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.149.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.149.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.15.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.15.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.15.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.15.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.15.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.15.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.150.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.150.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.150.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.150.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.150.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.150.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.151.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.151.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.151.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.151.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.151.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.151.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.152.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.152.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.152.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.152.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.152.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.152.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.153.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.153.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.153.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.153.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.153.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.153.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.154.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.154.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.154.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.154.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.154.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.154.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.155.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.155.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.155.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.155.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.155.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.155.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.156.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.156.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.156.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.156.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.156.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.156.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.157.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.157.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.157.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.157.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.157.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.157.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.158.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.158.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.158.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.158.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.158.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.158.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.159.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.159.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.159.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.159.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.159.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.159.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.16.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.16.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.16.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.16.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.16.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.16.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.17.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.17.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.17.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.17.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.17.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.17.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.18.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.18.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.18.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.18.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.18.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.18.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.19.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.19.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.19.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.19.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.19.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.19.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.2.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.2.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.2.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.2.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.2.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.2.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.20.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.20.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.20.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.20.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.20.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.20.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.21.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.21.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.21.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.21.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.21.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.21.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.22.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.22.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.22.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.22.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.22.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.22.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.23.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.23.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.23.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.23.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.23.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.23.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.24.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.24.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.24.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.24.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.24.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.24.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.25.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.25.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.25.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.25.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.25.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.25.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.26.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.26.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.26.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.26.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.26.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.26.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.27.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.27.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.27.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.27.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.27.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.27.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.28.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.28.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.28.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.28.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.28.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.28.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.29.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.29.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.29.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.29.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.29.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.29.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.3.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.3.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.3.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.3.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.3.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.3.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.30.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.30.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.30.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.30.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.30.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.30.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.31.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.31.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.31.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.31.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.31.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.31.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.32.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.32.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.32.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.32.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.32.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.32.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.33.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.33.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.33.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.33.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.33.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.33.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.34.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.34.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.34.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.34.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.34.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.34.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.35.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.35.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.35.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.35.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.35.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.35.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.36.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.36.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.36.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.36.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.36.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.36.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.37.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.37.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.37.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.37.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.37.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.37.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.38.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.38.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.38.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.38.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.38.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.38.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.39.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.39.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.39.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.39.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.39.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.39.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.4.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.4.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.4.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.4.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.4.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.4.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.40.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.40.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.40.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.40.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.40.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.40.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.41.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.41.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.41.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.41.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.41.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.41.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.42.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.42.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.42.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.42.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.42.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.42.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.43.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.43.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.43.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.43.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.43.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.43.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.44.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.44.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.44.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.44.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.44.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.44.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.45.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.45.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.45.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.45.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.45.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.45.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.46.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.46.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.46.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.46.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.46.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.46.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.47.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.47.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.47.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.47.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.47.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.47.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.48.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.48.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.48.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.48.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.48.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.48.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.49.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.49.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.49.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.49.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.49.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.49.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.5.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.5.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.5.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.5.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.5.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.5.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.50.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.50.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.50.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.50.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.50.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.50.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.51.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.51.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.51.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.51.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.51.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.51.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.52.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.52.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.52.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.52.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.52.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.52.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.53.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.53.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.53.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.53.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.53.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.53.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.54.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.54.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.54.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.54.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.54.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.54.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.55.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.55.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.55.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.55.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.55.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.55.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.56.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.56.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.56.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.56.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.56.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.56.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.57.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.57.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.57.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.57.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.57.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.57.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.58.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.58.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.58.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.58.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.58.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.58.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.59.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.59.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.59.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.59.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.59.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.59.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.6.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.6.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.6.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.6.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.6.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.6.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.60.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.60.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.60.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.60.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.60.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.60.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.61.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.61.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.61.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.61.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.61.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.61.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.62.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.62.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.62.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.62.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.62.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.62.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.63.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.63.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.63.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.63.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.63.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.63.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.64.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.64.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.64.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.64.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.64.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.64.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.65.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.65.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.65.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.65.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.65.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.65.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.66.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.66.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.66.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.66.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.66.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.66.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.67.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.67.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.67.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.67.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.67.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.67.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.68.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.68.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.68.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.68.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.68.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.68.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.69.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.69.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.69.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.69.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.69.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.69.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.7.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.7.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.7.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.7.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.7.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.7.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.70.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.70.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.70.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.70.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.70.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.70.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.71.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.71.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.71.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.71.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.71.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.71.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.72.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.72.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.72.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.72.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.72.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.72.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.73.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.73.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.73.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.73.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.73.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.73.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.74.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.74.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.74.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.74.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.74.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.74.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.75.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.75.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.75.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.75.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.75.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.75.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.76.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.76.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.76.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.76.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.76.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.76.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.77.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.77.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.77.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.77.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.77.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.77.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.78.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.78.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.78.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.78.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.78.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.78.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.79.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.79.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.79.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.79.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.79.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.79.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.8.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.8.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.8.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.8.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.8.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.8.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.80.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.80.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.80.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.80.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.80.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.80.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.81.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.81.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.81.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.81.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.81.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.81.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.82.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.82.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.82.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.82.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.82.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.82.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.83.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.83.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.83.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.83.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.83.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.83.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.84.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.84.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.84.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.84.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.84.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.84.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.85.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.85.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.85.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.85.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.85.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.85.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.86.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.86.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.86.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.86.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.86.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.86.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.87.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.87.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.87.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.87.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.87.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.87.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.88.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.88.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.88.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.88.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.88.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.88.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.89.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.89.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.89.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.89.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.89.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.89.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.9.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.9.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.9.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.9.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.9.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.9.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.90.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.90.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.90.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.90.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.90.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.90.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.91.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.91.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.91.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.91.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.91.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.91.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.92.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.92.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.92.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.92.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.92.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.92.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.93.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.93.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.93.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.93.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.93.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.93.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.94.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.94.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.94.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.94.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.94.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.94.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.95.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.95.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.95.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.95.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.95.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.95.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.96.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.96.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.96.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.96.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.96.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.96.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.97.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.97.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.97.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.97.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.97.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.97.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.98.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.98.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.98.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.98.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.98.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.98.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.99.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.99.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.99.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.99.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.99.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.experts.99.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.gate.e_score_correction_bias": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.gate.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.shared_experts.down_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.shared_experts.down_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.shared_experts.gate_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.shared_experts.gate_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.shared_experts.up_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.mlp.shared_experts.up_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.post_attention_layernorm.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.self_attn.k_norm.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.self_attn.k_proj.bias": "model-00070-of-00092.safetensors",
+ "model.layers.69.self_attn.k_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.self_attn.k_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.self_attn.o_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.self_attn.o_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.self_attn.q_norm.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.self_attn.q_proj.bias": "model-00070-of-00092.safetensors",
+ "model.layers.69.self_attn.q_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.self_attn.q_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.69.self_attn.v_proj.bias": "model-00070-of-00092.safetensors",
+ "model.layers.69.self_attn.v_proj.weight": "model-00070-of-00092.safetensors",
+ "model.layers.69.self_attn.v_proj.weight_scale": "model-00070-of-00092.safetensors",
+ "model.layers.7.input_layernorm.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.0.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.0.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.0.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.0.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.0.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.0.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.1.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.1.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.1.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.1.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.1.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.1.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.10.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.10.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.10.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.10.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.10.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.10.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.100.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.100.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.100.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.100.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.100.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.100.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.101.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.101.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.101.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.101.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.101.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.101.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.102.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.102.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.102.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.102.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.102.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.102.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.103.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.103.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.103.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.103.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.103.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.103.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.104.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.104.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.104.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.104.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.104.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.104.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.105.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.105.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.105.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.105.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.105.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.105.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.106.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.106.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.106.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.106.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.106.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.106.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.107.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.107.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.107.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.107.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.107.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.107.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.108.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.108.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.108.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.108.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.108.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.108.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.109.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.109.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.109.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.109.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.109.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.109.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.11.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.11.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.11.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.11.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.11.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.11.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.110.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.110.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.110.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.110.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.110.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.110.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.111.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.111.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.111.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.111.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.111.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.111.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.112.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.112.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.112.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.112.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.112.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.112.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.113.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.113.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.113.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.113.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.113.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.113.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.114.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.114.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.114.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.114.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.114.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.114.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.115.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.115.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.115.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.115.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.115.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.115.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.116.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.116.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.116.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.116.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.116.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.116.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.117.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.117.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.117.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.117.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.117.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.117.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.118.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.118.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.118.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.118.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.118.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.118.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.119.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.119.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.119.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.119.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.119.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.119.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.12.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.12.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.12.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.12.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.12.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.12.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.120.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.120.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.120.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.120.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.120.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.120.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.121.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.121.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.121.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.121.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.121.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.121.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.122.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.122.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.122.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.122.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.122.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.122.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.123.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.123.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.123.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.123.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.123.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.123.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.124.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.124.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.124.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.124.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.124.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.124.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.125.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.125.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.125.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.125.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.125.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.125.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.126.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.126.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.126.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.126.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.126.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.126.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.127.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.127.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.127.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.127.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.127.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.127.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.128.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.128.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.128.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.128.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.128.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.128.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.129.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.129.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.129.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.129.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.129.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.129.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.13.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.13.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.13.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.13.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.13.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.13.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.130.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.130.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.130.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.130.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.130.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.130.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.131.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.131.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.131.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.131.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.131.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.131.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.132.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.132.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.132.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.132.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.132.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.132.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.133.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.133.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.133.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.133.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.133.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.133.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.134.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.134.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.134.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.134.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.134.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.134.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.135.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.135.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.135.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.135.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.135.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.135.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.136.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.136.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.136.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.136.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.136.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.136.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.137.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.137.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.137.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.137.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.137.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.137.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.138.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.138.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.138.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.138.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.138.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.138.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.139.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.139.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.139.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.139.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.139.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.139.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.14.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.14.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.14.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.14.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.14.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.14.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.140.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.140.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.140.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.140.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.140.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.140.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.141.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.141.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.141.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.141.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.141.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.141.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.142.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.142.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.142.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.142.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.142.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.142.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.143.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.143.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.143.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.143.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.143.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.143.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.144.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.144.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.144.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.144.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.144.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.144.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.145.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.145.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.145.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.145.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.145.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.145.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.146.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.146.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.146.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.146.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.146.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.146.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.147.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.147.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.147.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.147.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.147.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.147.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.148.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.148.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.148.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.148.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.148.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.148.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.149.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.149.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.149.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.149.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.149.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.149.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.15.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.15.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.15.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.15.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.15.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.15.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.150.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.150.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.150.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.150.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.150.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.150.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.151.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.151.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.151.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.151.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.151.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.151.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.152.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.152.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.152.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.152.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.152.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.152.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.153.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.153.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.153.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.153.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.153.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.153.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.154.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.154.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.154.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.154.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.154.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.154.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.155.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.155.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.155.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.155.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.155.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.155.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.156.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.156.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.156.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.156.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.156.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.156.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.157.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.157.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.157.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.157.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.157.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.157.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.158.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.158.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.158.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.158.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.158.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.158.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.159.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.159.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.159.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.159.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.159.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.159.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.16.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.16.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.16.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.16.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.16.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.16.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.17.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.17.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.17.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.17.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.17.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.17.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.18.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.18.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.18.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.18.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.18.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.18.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.19.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.19.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.19.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.19.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.19.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.19.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.2.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.2.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.2.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.2.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.2.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.2.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.20.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.20.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.20.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.20.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.20.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.20.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.21.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.21.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.21.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.21.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.21.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.21.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.22.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.22.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.22.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.22.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.22.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.22.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.23.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.23.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.23.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.23.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.23.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.23.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.24.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.24.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.24.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.24.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.24.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.24.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.25.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.25.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.25.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.25.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.25.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.25.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.26.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.26.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.26.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.26.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.26.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.26.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.27.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.27.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.27.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.27.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.27.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.27.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.28.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.28.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.28.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.28.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.28.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.28.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.29.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.29.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.29.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.29.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.29.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.29.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.3.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.3.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.3.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.3.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.3.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.3.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.30.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.30.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.30.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.30.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.30.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.30.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.31.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.31.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.31.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.31.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.31.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.31.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.32.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.32.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.32.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.32.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.32.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.32.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.33.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.33.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.33.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.33.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.33.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.33.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.34.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.34.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.34.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.34.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.34.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.34.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.35.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.35.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.35.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.35.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.35.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.35.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.36.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.36.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.36.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.36.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.36.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.36.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.37.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.37.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.37.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.37.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.37.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.37.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.38.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.38.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.38.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.38.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.38.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.38.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.39.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.39.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.39.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.39.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.39.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.39.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.4.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.4.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.4.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.4.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.4.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.4.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.40.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.40.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.40.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.40.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.40.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.40.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.41.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.41.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.41.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.41.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.41.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.41.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.42.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.42.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.42.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.42.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.42.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.42.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.43.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.43.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.43.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.43.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.43.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.43.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.44.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.44.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.44.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.44.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.44.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.44.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.45.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.45.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.45.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.45.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.45.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.45.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.46.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.46.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.46.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.46.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.46.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.46.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.47.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.47.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.47.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.47.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.47.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.47.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.48.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.48.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.48.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.48.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.48.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.48.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.49.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.49.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.49.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.49.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.49.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.49.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.5.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.5.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.5.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.5.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.5.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.5.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.50.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.50.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.50.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.50.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.50.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.50.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.51.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.51.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.51.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.51.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.51.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.51.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.52.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.52.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.52.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.52.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.52.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.52.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.53.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.53.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.53.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.53.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.53.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.53.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.54.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.54.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.54.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.54.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.54.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.54.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.55.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.55.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.55.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.55.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.55.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.55.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.56.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.56.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.56.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.56.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.56.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.56.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.57.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.57.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.57.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.57.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.57.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.57.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.58.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.58.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.58.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.58.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.58.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.58.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.59.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.59.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.59.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.59.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.59.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.59.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.6.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.6.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.6.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.6.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.6.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.6.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.60.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.60.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.60.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.60.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.60.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.60.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.61.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.61.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.61.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.61.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.61.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.61.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.62.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.62.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.62.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.62.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.62.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.62.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.63.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.63.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.63.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.63.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.63.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.63.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.64.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.64.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.64.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.64.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.64.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.64.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.65.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.65.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.65.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.65.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.65.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.65.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.66.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.66.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.66.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.66.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.66.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.66.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.67.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.67.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.67.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.67.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.67.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.67.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.68.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.68.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.68.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.68.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.68.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.68.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.69.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.69.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.69.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.69.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.69.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.69.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.7.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.7.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.7.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.7.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.7.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.7.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.70.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.70.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.70.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.70.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.70.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.70.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.71.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.71.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.71.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.71.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.71.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.71.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.72.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.72.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.72.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.72.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.72.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.72.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.73.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.73.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.73.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.73.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.73.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.73.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.74.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.74.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.74.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.74.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.74.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.74.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.75.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.75.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.75.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.75.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.75.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.75.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.76.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.76.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.76.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.76.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.76.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.76.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.77.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.77.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.77.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.77.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.77.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.77.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.78.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.78.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.78.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.78.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.78.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.78.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.79.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.79.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.79.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.79.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.79.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.79.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.8.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.8.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.8.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.8.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.8.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.8.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.80.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.80.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.80.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.80.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.80.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.80.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.81.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.81.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.81.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.81.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.81.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.81.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.82.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.82.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.82.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.82.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.82.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.82.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.83.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.83.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.83.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.83.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.83.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.83.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.84.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.84.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.84.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.84.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.84.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.84.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.85.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.85.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.85.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.85.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.85.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.85.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.86.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.86.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.86.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.86.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.86.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.86.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.87.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.87.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.87.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.87.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.87.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.87.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.88.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.88.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.88.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.88.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.88.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.88.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.89.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.89.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.89.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.89.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.89.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.89.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.9.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.9.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.9.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.9.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.9.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.9.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.90.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.90.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.90.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.90.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.90.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.90.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.91.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.91.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.91.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.91.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.91.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.91.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.92.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.92.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.92.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.92.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.92.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.92.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.93.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.93.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.93.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.93.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.93.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.93.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.94.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.94.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.94.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.94.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.94.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.94.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.95.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.95.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.95.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.95.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.95.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.95.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.96.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.96.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.96.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.96.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.96.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.96.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.97.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.97.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.97.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.97.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.97.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.97.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.98.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.98.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.98.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.98.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.98.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.98.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.99.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.99.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.99.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.99.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.99.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.experts.99.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.gate.e_score_correction_bias": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.gate.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.shared_experts.down_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.shared_experts.down_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.shared_experts.gate_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.shared_experts.gate_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.shared_experts.up_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.mlp.shared_experts.up_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.post_attention_layernorm.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.self_attn.k_norm.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.self_attn.k_proj.bias": "model-00008-of-00092.safetensors",
+ "model.layers.7.self_attn.k_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.self_attn.k_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.self_attn.o_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.self_attn.o_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.self_attn.q_norm.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.self_attn.q_proj.bias": "model-00008-of-00092.safetensors",
+ "model.layers.7.self_attn.q_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.self_attn.q_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.7.self_attn.v_proj.bias": "model-00008-of-00092.safetensors",
+ "model.layers.7.self_attn.v_proj.weight": "model-00008-of-00092.safetensors",
+ "model.layers.7.self_attn.v_proj.weight_scale": "model-00008-of-00092.safetensors",
+ "model.layers.70.input_layernorm.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.0.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.0.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.0.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.0.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.0.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.0.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.1.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.1.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.1.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.1.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.1.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.1.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.10.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.10.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.10.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.10.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.10.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.10.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.100.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.100.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.100.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.100.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.100.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.100.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.101.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.101.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.101.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.101.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.101.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.101.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.102.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.102.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.102.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.102.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.102.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.102.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.103.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.103.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.103.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.103.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.103.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.103.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.104.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.104.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.104.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.104.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.104.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.104.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.105.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.105.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.105.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.105.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.105.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.105.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.106.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.106.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.106.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.106.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.106.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.106.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.107.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.107.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.107.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.107.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.107.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.107.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.108.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.108.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.108.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.108.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.108.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.108.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.109.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.109.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.109.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.109.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.109.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.109.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.11.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.11.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.11.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.11.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.11.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.11.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.110.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.110.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.110.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.110.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.110.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.110.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.111.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.111.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.111.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.111.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.111.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.111.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.112.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.112.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.112.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.112.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.112.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.112.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.113.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.113.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.113.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.113.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.113.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.113.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.114.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.114.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.114.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.114.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.114.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.114.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.115.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.115.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.115.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.115.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.115.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.115.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.116.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.116.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.116.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.116.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.116.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.116.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.117.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.117.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.117.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.117.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.117.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.117.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.118.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.118.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.118.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.118.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.118.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.118.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.119.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.119.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.119.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.119.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.119.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.119.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.12.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.12.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.12.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.12.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.12.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.12.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.120.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.120.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.120.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.120.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.120.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.120.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.121.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.121.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.121.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.121.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.121.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.121.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.122.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.122.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.122.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.122.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.122.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.122.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.123.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.123.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.123.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.123.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.123.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.123.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.124.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.124.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.124.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.124.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.124.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.124.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.125.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.125.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.125.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.125.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.125.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.125.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.126.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.126.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.126.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.126.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.126.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.126.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.127.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.127.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.127.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.127.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.127.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.127.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.128.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.128.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.128.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.128.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.128.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.128.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.129.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.129.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.129.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.129.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.129.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.129.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.13.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.13.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.13.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.13.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.13.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.13.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.130.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.130.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.130.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.130.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.130.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.130.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.131.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.131.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.131.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.131.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.131.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.131.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.132.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.132.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.132.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.132.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.132.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.132.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.133.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.133.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.133.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.133.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.133.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.133.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.134.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.134.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.134.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.134.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.134.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.134.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.135.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.135.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.135.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.135.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.135.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.135.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.136.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.136.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.136.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.136.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.136.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.136.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.137.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.137.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.137.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.137.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.137.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.137.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.138.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.138.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.138.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.138.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.138.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.138.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.139.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.139.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.139.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.139.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.139.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.139.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.14.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.14.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.14.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.14.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.14.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.14.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.140.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.140.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.140.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.140.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.140.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.140.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.141.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.141.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.141.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.141.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.141.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.141.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.142.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.142.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.142.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.142.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.142.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.142.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.143.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.143.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.143.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.143.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.143.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.143.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.144.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.144.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.144.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.144.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.144.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.144.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.145.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.145.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.145.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.145.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.145.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.145.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.146.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.146.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.146.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.146.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.146.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.146.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.147.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.147.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.147.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.147.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.147.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.147.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.148.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.148.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.148.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.148.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.148.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.148.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.149.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.149.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.149.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.149.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.149.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.149.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.15.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.15.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.15.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.15.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.15.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.15.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.150.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.150.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.150.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.150.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.150.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.150.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.151.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.151.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.151.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.151.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.151.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.151.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.152.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.152.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.152.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.152.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.152.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.152.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.153.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.153.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.153.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.153.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.153.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.153.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.154.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.154.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.154.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.154.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.154.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.154.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.155.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.155.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.155.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.155.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.155.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.155.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.156.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.156.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.156.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.156.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.156.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.156.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.157.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.157.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.157.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.157.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.157.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.157.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.158.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.158.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.158.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.158.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.158.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.158.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.159.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.159.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.159.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.159.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.159.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.159.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.16.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.16.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.16.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.16.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.16.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.16.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.17.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.17.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.17.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.17.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.17.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.17.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.18.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.18.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.18.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.18.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.18.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.18.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.19.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.19.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.19.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.19.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.19.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.19.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.2.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.2.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.2.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.2.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.2.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.2.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.20.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.20.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.20.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.20.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.20.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.20.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.21.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.21.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.21.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.21.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.21.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.21.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.22.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.22.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.22.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.22.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.22.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.22.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.23.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.23.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.23.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.23.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.23.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.23.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.24.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.24.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.24.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.24.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.24.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.24.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.25.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.25.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.25.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.25.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.25.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.25.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.26.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.26.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.26.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.26.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.26.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.26.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.27.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.27.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.27.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.27.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.27.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.27.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.28.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.28.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.28.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.28.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.28.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.28.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.29.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.29.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.29.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.29.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.29.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.29.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.3.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.3.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.3.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.3.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.3.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.3.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.30.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.30.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.30.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.30.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.30.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.30.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.31.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.31.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.31.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.31.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.31.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.31.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.32.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.32.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.32.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.32.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.32.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.32.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.33.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.33.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.33.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.33.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.33.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.33.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.34.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.34.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.34.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.34.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.34.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.34.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.35.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.35.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.35.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.35.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.35.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.35.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.36.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.36.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.36.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.36.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.36.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.36.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.37.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.37.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.37.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.37.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.37.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.37.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.38.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.38.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.38.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.38.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.38.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.38.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.39.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.39.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.39.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.39.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.39.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.39.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.4.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.4.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.4.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.4.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.4.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.4.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.40.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.40.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.40.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.40.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.40.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.40.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.41.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.41.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.41.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.41.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.41.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.41.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.42.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.42.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.42.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.42.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.42.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.42.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.43.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.43.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.43.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.43.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.43.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.43.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.44.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.44.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.44.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.44.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.44.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.44.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.45.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.45.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.45.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.45.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.45.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.45.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.46.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.46.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.46.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.46.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.46.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.46.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.47.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.47.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.47.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.47.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.47.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.47.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.48.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.48.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.48.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.48.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.48.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.48.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.49.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.49.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.49.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.49.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.49.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.49.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.5.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.5.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.5.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.5.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.5.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.5.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.50.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.50.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.50.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.50.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.50.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.50.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.51.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.51.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.51.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.51.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.51.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.51.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.52.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.52.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.52.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.52.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.52.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.52.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.53.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.53.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.53.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.53.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.53.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.53.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.54.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.54.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.54.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.54.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.54.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.54.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.55.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.55.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.55.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.55.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.55.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.55.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.56.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.56.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.56.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.56.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.56.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.56.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.57.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.57.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.57.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.57.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.57.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.57.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.58.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.58.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.58.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.58.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.58.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.58.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.59.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.59.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.59.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.59.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.59.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.59.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.6.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.6.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.6.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.6.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.6.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.6.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.60.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.60.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.60.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.60.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.60.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.60.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.61.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.61.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.61.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.61.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.61.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.61.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.62.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.62.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.62.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.62.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.62.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.62.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.63.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.63.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.63.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.63.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.63.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.63.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.64.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.64.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.64.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.64.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.64.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.64.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.65.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.65.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.65.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.65.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.65.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.65.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.66.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.66.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.66.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.66.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.66.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.66.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.67.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.67.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.67.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.67.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.67.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.67.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.68.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.68.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.68.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.68.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.68.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.68.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.69.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.69.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.69.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.69.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.69.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.69.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.7.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.7.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.7.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.7.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.7.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.7.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.70.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.70.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.70.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.70.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.70.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.70.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.71.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.71.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.71.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.71.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.71.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.71.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.72.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.72.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.72.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.72.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.72.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.72.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.73.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.73.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.73.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.73.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.73.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.73.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.74.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.74.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.74.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.74.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.74.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.74.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.75.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.75.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.75.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.75.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.75.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.75.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.76.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.76.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.76.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.76.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.76.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.76.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.77.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.77.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.77.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.77.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.77.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.77.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.78.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.78.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.78.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.78.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.78.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.78.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.79.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.79.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.79.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.79.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.79.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.79.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.8.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.8.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.8.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.8.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.8.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.8.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.80.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.80.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.80.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.80.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.80.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.80.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.81.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.81.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.81.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.81.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.81.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.81.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.82.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.82.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.82.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.82.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.82.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.82.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.83.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.83.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.83.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.83.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.83.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.83.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.84.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.84.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.84.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.84.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.84.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.84.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.85.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.85.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.85.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.85.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.85.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.85.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.86.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.86.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.86.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.86.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.86.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.86.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.87.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.87.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.87.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.87.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.87.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.87.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.88.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.88.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.88.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.88.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.88.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.88.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.89.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.89.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.89.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.89.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.89.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.89.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.9.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.9.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.9.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.9.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.9.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.9.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.90.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.90.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.90.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.90.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.90.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.90.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.91.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.91.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.91.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.91.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.91.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.91.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.92.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.92.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.92.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.92.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.92.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.92.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.93.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.93.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.93.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.93.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.93.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.93.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.94.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.94.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.94.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.94.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.94.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.94.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.95.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.95.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.95.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.95.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.95.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.95.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.96.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.96.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.96.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.96.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.96.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.96.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.97.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.97.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.97.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.97.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.97.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.97.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.98.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.98.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.98.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.98.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.98.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.98.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.99.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.99.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.99.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.99.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.99.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.experts.99.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.gate.e_score_correction_bias": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.gate.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.shared_experts.down_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.shared_experts.down_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.shared_experts.gate_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.shared_experts.gate_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.shared_experts.up_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.mlp.shared_experts.up_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.post_attention_layernorm.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.self_attn.k_norm.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.self_attn.k_proj.bias": "model-00071-of-00092.safetensors",
+ "model.layers.70.self_attn.k_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.self_attn.k_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.self_attn.o_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.self_attn.o_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.self_attn.q_norm.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.self_attn.q_proj.bias": "model-00071-of-00092.safetensors",
+ "model.layers.70.self_attn.q_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.self_attn.q_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.70.self_attn.v_proj.bias": "model-00071-of-00092.safetensors",
+ "model.layers.70.self_attn.v_proj.weight": "model-00071-of-00092.safetensors",
+ "model.layers.70.self_attn.v_proj.weight_scale": "model-00071-of-00092.safetensors",
+ "model.layers.71.input_layernorm.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.0.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.0.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.0.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.0.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.0.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.0.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.1.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.1.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.1.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.1.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.1.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.1.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.10.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.10.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.10.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.10.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.10.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.10.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.100.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.100.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.100.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.100.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.100.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.100.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.101.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.101.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.101.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.101.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.101.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.101.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.102.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.102.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.102.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.102.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.102.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.102.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.103.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.103.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.103.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.103.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.103.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.103.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.104.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.104.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.104.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.104.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.104.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.104.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.105.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.105.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.105.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.105.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.105.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.105.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.106.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.106.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.106.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.106.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.106.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.106.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.107.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.107.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.107.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.107.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.107.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.107.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.108.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.108.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.108.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.108.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.108.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.108.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.109.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.109.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.109.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.109.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.109.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.109.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.11.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.11.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.11.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.11.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.11.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.11.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.110.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.110.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.110.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.110.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.110.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.110.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.111.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.111.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.111.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.111.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.111.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.111.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.112.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.112.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.112.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.112.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.112.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.112.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.113.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.113.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.113.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.113.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.113.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.113.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.114.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.114.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.114.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.114.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.114.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.114.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.115.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.115.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.115.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.115.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.115.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.115.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.116.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.116.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.116.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.116.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.116.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.116.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.117.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.117.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.117.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.117.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.117.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.117.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.118.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.118.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.118.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.118.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.118.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.118.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.119.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.119.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.119.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.119.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.119.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.119.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.12.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.12.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.12.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.12.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.12.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.12.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.120.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.120.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.120.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.120.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.120.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.120.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.121.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.121.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.121.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.121.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.121.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.121.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.122.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.122.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.122.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.122.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.122.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.122.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.123.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.123.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.123.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.123.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.123.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.123.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.124.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.124.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.124.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.124.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.124.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.124.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.125.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.125.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.125.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.125.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.125.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.125.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.126.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.126.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.126.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.126.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.126.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.126.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.127.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.127.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.127.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.127.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.127.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.127.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.128.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.128.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.128.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.128.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.128.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.128.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.129.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.129.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.129.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.129.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.129.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.129.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.13.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.13.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.13.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.13.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.13.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.13.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.130.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.130.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.130.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.130.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.130.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.130.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.131.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.131.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.131.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.131.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.131.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.131.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.132.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.132.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.132.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.132.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.132.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.132.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.133.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.133.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.133.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.133.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.133.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.133.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.134.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.134.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.134.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.134.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.134.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.134.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.135.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.135.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.135.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.135.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.135.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.135.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.136.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.136.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.136.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.136.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.136.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.136.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.137.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.137.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.137.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.137.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.137.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.137.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.138.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.138.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.138.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.138.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.138.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.138.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.139.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.139.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.139.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.139.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.139.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.139.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.14.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.14.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.14.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.14.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.14.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.14.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.140.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.140.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.140.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.140.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.140.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.140.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.141.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.141.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.141.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.141.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.141.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.141.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.142.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.142.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.142.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.142.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.142.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.142.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.143.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.143.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.143.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.143.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.143.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.143.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.144.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.144.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.144.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.144.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.144.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.144.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.145.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.145.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.145.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.145.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.145.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.145.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.146.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.146.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.146.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.146.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.146.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.146.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.147.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.147.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.147.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.147.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.147.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.147.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.148.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.148.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.148.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.148.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.148.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.148.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.149.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.149.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.149.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.149.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.149.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.149.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.15.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.15.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.15.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.15.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.15.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.15.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.150.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.150.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.150.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.150.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.150.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.150.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.151.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.151.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.151.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.151.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.151.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.151.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.152.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.152.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.152.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.152.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.152.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.152.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.153.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.153.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.153.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.153.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.153.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.153.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.154.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.154.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.154.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.154.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.154.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.154.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.155.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.155.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.155.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.155.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.155.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.155.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.156.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.156.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.156.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.156.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.156.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.156.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.157.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.157.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.157.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.157.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.157.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.157.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.158.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.158.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.158.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.158.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.158.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.158.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.159.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.159.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.159.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.159.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.159.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.159.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.16.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.16.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.16.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.16.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.16.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.16.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.17.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.17.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.17.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.17.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.17.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.17.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.18.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.18.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.18.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.18.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.18.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.18.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.19.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.19.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.19.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.19.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.19.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.19.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.2.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.2.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.2.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.2.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.2.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.2.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.20.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.20.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.20.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.20.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.20.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.20.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.21.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.21.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.21.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.21.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.21.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.21.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.22.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.22.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.22.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.22.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.22.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.22.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.23.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.23.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.23.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.23.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.23.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.23.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.24.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.24.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.24.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.24.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.24.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.24.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.25.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.25.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.25.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.25.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.25.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.25.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.26.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.26.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.26.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.26.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.26.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.26.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.27.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.27.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.27.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.27.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.27.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.27.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.28.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.28.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.28.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.28.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.28.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.28.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.29.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.29.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.29.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.29.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.29.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.29.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.3.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.3.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.3.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.3.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.3.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.3.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.30.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.30.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.30.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.30.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.30.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.30.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.31.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.31.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.31.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.31.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.31.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.31.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.32.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.32.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.32.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.32.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.32.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.32.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.33.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.33.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.33.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.33.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.33.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.33.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.34.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.34.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.34.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.34.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.34.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.34.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.35.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.35.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.35.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.35.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.35.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.35.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.36.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.36.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.36.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.36.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.36.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.36.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.37.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.37.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.37.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.37.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.37.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.37.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.38.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.38.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.38.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.38.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.38.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.38.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.39.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.39.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.39.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.39.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.39.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.39.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.4.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.4.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.4.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.4.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.4.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.4.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.40.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.40.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.40.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.40.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.40.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.40.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.41.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.41.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.41.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.41.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.41.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.41.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.42.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.42.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.42.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.42.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.42.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.42.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.43.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.43.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.43.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.43.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.43.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.43.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.44.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.44.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.44.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.44.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.44.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.44.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.45.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.45.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.45.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.45.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.45.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.45.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.46.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.46.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.46.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.46.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.46.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.46.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.47.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.47.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.47.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.47.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.47.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.47.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.48.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.48.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.48.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.48.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.48.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.48.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.49.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.49.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.49.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.49.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.49.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.49.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.5.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.5.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.5.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.5.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.5.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.5.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.50.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.50.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.50.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.50.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.50.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.50.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.51.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.51.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.51.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.51.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.51.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.51.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.52.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.52.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.52.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.52.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.52.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.52.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.53.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.53.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.53.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.53.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.53.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.53.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.54.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.54.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.54.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.54.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.54.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.54.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.55.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.55.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.55.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.55.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.55.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.55.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.56.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.56.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.56.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.56.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.56.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.56.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.57.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.57.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.57.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.57.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.57.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.57.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.58.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.58.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.58.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.58.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.58.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.58.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.59.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.59.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.59.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.59.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.59.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.59.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.6.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.6.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.6.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.6.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.6.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.6.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.60.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.60.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.60.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.60.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.60.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.60.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.61.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.61.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.61.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.61.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.61.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.61.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.62.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.62.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.62.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.62.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.62.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.62.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.63.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.63.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.63.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.63.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.63.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.63.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.64.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.64.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.64.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.64.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.64.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.64.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.65.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.65.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.65.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.65.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.65.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.65.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.66.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.66.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.66.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.66.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.66.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.66.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.67.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.67.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.67.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.67.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.67.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.67.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.68.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.68.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.68.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.68.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.68.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.68.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.69.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.69.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.69.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.69.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.69.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.69.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.7.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.7.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.7.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.7.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.7.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.7.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.70.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.70.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.70.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.70.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.70.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.70.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.71.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.71.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.71.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.71.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.71.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.71.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.72.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.72.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.72.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.72.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.72.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.72.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.73.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.73.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.73.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.73.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.73.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.73.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.74.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.74.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.74.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.74.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.74.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.74.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.75.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.75.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.75.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.75.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.75.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.75.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.76.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.76.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.76.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.76.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.76.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.76.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.77.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.77.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.77.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.77.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.77.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.77.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.78.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.78.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.78.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.78.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.78.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.78.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.79.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.79.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.79.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.79.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.79.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.79.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.8.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.8.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.8.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.8.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.8.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.8.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.80.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.80.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.80.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.80.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.80.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.80.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.81.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.81.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.81.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.81.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.81.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.81.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.82.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.82.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.82.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.82.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.82.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.82.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.83.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.83.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.83.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.83.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.83.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.83.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.84.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.84.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.84.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.84.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.84.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.84.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.85.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.85.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.85.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.85.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.85.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.85.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.86.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.86.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.86.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.86.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.86.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.86.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.87.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.87.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.87.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.87.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.87.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.87.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.88.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.88.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.88.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.88.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.88.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.88.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.89.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.89.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.89.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.89.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.89.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.89.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.9.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.9.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.9.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.9.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.9.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.9.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.90.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.90.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.90.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.90.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.90.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.90.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.91.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.91.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.91.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.91.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.91.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.91.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.92.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.92.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.92.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.92.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.92.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.92.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.93.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.93.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.93.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.93.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.93.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.93.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.94.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.94.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.94.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.94.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.94.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.94.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.95.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.95.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.95.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.95.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.95.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.95.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.96.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.96.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.96.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.96.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.96.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.96.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.97.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.97.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.97.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.97.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.97.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.97.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.98.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.98.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.98.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.98.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.98.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.98.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.99.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.99.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.99.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.99.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.99.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.experts.99.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.gate.e_score_correction_bias": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.gate.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.shared_experts.down_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.shared_experts.down_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.shared_experts.gate_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.shared_experts.gate_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.shared_experts.up_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.mlp.shared_experts.up_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.post_attention_layernorm.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.self_attn.k_norm.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.self_attn.k_proj.bias": "model-00072-of-00092.safetensors",
+ "model.layers.71.self_attn.k_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.self_attn.k_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.self_attn.o_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.self_attn.o_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.self_attn.q_norm.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.self_attn.q_proj.bias": "model-00072-of-00092.safetensors",
+ "model.layers.71.self_attn.q_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.self_attn.q_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.71.self_attn.v_proj.bias": "model-00072-of-00092.safetensors",
+ "model.layers.71.self_attn.v_proj.weight": "model-00072-of-00092.safetensors",
+ "model.layers.71.self_attn.v_proj.weight_scale": "model-00072-of-00092.safetensors",
+ "model.layers.72.input_layernorm.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.0.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.0.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.0.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.0.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.0.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.0.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.1.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.1.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.1.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.1.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.1.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.1.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.10.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.10.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.10.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.10.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.10.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.10.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.100.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.100.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.100.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.100.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.100.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.100.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.101.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.101.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.101.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.101.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.101.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.101.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.102.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.102.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.102.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.102.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.102.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.102.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.103.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.103.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.103.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.103.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.103.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.103.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.104.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.104.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.104.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.104.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.104.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.104.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.105.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.105.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.105.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.105.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.105.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.105.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.106.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.106.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.106.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.106.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.106.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.106.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.107.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.107.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.107.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.107.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.107.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.107.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.108.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.108.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.108.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.108.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.108.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.108.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.109.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.109.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.109.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.109.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.109.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.109.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.11.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.11.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.11.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.11.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.11.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.11.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.110.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.110.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.110.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.110.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.110.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.110.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.111.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.111.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.111.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.111.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.111.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.111.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.112.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.112.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.112.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.112.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.112.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.112.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.113.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.113.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.113.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.113.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.113.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.113.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.114.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.114.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.114.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.114.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.114.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.114.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.115.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.115.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.115.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.115.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.115.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.115.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.116.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.116.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.116.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.116.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.116.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.116.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.117.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.117.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.117.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.117.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.117.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.117.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.118.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.118.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.118.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.118.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.118.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.118.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.119.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.119.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.119.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.119.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.119.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.119.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.12.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.12.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.12.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.12.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.12.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.12.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.120.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.120.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.120.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.120.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.120.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.120.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.121.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.121.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.121.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.121.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.121.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.121.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.122.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.122.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.122.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.122.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.122.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.122.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.123.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.123.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.123.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.123.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.123.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.123.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.124.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.124.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.124.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.124.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.124.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.124.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.125.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.125.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.125.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.125.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.125.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.125.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.126.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.126.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.126.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.126.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.126.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.126.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.127.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.127.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.127.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.127.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.127.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.127.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.128.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.128.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.128.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.128.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.128.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.128.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.129.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.129.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.129.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.129.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.129.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.129.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.13.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.13.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.13.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.13.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.13.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.13.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.130.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.130.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.130.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.130.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.130.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.130.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.131.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.131.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.131.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.131.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.131.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.131.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.132.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.132.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.132.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.132.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.132.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.132.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.133.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.133.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.133.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.133.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.133.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.133.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.134.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.134.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.134.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.134.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.134.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.134.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.135.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.135.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.135.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.135.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.135.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.135.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.136.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.136.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.136.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.136.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.136.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.136.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.137.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.137.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.137.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.137.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.137.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.137.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.138.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.138.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.138.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.138.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.138.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.138.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.139.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.139.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.139.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.139.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.139.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.139.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.14.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.14.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.14.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.14.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.14.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.14.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.140.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.140.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.140.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.140.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.140.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.140.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.141.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.141.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.141.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.141.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.141.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.141.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.142.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.142.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.142.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.142.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.142.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.142.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.143.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.143.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.143.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.143.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.143.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.143.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.144.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.144.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.144.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.144.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.144.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.144.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.145.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.145.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.145.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.145.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.145.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.145.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.146.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.146.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.146.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.146.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.146.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.146.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.147.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.147.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.147.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.147.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.147.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.147.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.148.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.148.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.148.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.148.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.148.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.148.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.149.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.149.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.149.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.149.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.149.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.149.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.15.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.15.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.15.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.15.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.15.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.15.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.150.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.150.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.150.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.150.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.150.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.150.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.151.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.151.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.151.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.151.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.151.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.151.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.152.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.152.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.152.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.152.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.152.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.152.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.153.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.153.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.153.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.153.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.153.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.153.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.154.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.154.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.154.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.154.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.154.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.154.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.155.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.155.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.155.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.155.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.155.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.155.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.156.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.156.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.156.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.156.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.156.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.156.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.157.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.157.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.157.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.157.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.157.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.157.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.158.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.158.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.158.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.158.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.158.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.158.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.159.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.159.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.159.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.159.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.159.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.159.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.16.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.16.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.16.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.16.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.16.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.16.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.17.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.17.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.17.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.17.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.17.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.17.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.18.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.18.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.18.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.18.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.18.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.18.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.19.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.19.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.19.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.19.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.19.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.19.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.2.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.2.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.2.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.2.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.2.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.2.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.20.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.20.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.20.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.20.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.20.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.20.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.21.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.21.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.21.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.21.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.21.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.21.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.22.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.22.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.22.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.22.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.22.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.22.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.23.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.23.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.23.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.23.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.23.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.23.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.24.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.24.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.24.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.24.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.24.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.24.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.25.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.25.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.25.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.25.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.25.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.25.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.26.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.26.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.26.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.26.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.26.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.26.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.27.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.27.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.27.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.27.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.27.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.27.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.28.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.28.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.28.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.28.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.28.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.28.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.29.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.29.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.29.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.29.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.29.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.29.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.3.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.3.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.3.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.3.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.3.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.3.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.30.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.30.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.30.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.30.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.30.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.30.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.31.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.31.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.31.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.31.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.31.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.31.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.32.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.32.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.32.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.32.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.32.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.32.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.33.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.33.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.33.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.33.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.33.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.33.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.34.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.34.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.34.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.34.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.34.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.34.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.35.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.35.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.35.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.35.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.35.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.35.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.36.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.36.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.36.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.36.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.36.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.36.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.37.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.37.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.37.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.37.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.37.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.37.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.38.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.38.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.38.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.38.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.38.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.38.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.39.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.39.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.39.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.39.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.39.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.39.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.4.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.4.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.4.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.4.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.4.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.4.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.40.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.40.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.40.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.40.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.40.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.40.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.41.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.41.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.41.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.41.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.41.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.41.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.42.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.42.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.42.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.42.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.42.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.42.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.43.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.43.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.43.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.43.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.43.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.43.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.44.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.44.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.44.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.44.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.44.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.44.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.45.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.45.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.45.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.45.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.45.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.45.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.46.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.46.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.46.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.46.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.46.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.46.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.47.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.47.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.47.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.47.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.47.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.47.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.48.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.48.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.48.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.48.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.48.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.48.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.49.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.49.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.49.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.49.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.49.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.49.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.5.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.5.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.5.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.5.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.5.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.5.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.50.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.50.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.50.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.50.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.50.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.50.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.51.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.51.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.51.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.51.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.51.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.51.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.52.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.52.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.52.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.52.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.52.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.52.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.53.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.53.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.53.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.53.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.53.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.53.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.54.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.54.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.54.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.54.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.54.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.54.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.55.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.55.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.55.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.55.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.55.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.55.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.56.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.56.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.56.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.56.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.56.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.56.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.57.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.57.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.57.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.57.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.57.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.57.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.58.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.58.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.58.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.58.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.58.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.58.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.59.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.59.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.59.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.59.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.59.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.59.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.6.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.6.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.6.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.6.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.6.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.6.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.60.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.60.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.60.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.60.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.60.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.60.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.61.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.61.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.61.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.61.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.61.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.61.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.62.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.62.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.62.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.62.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.62.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.62.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.63.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.63.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.63.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.63.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.63.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.63.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.64.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.64.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.64.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.64.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.64.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.64.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.65.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.65.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.65.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.65.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.65.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.65.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.66.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.66.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.66.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.66.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.66.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.66.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.67.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.67.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.67.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.67.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.67.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.67.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.68.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.68.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.68.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.68.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.68.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.68.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.69.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.69.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.69.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.69.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.69.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.69.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.7.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.7.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.7.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.7.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.7.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.7.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.70.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.70.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.70.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.70.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.70.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.70.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.71.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.71.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.71.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.71.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.71.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.71.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.72.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.72.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.72.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.72.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.72.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.72.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.73.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.73.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.73.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.73.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.73.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.73.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.74.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.74.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.74.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.74.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.74.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.74.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.75.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.75.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.75.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.75.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.75.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.75.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.76.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.76.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.76.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.76.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.76.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.76.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.77.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.77.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.77.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.77.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.77.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.77.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.78.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.78.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.78.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.78.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.78.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.78.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.79.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.79.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.79.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.79.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.79.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.79.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.8.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.8.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.8.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.8.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.8.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.8.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.80.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.80.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.80.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.80.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.80.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.80.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.81.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.81.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.81.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.81.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.81.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.81.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.82.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.82.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.82.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.82.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.82.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.82.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.83.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.83.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.83.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.83.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.83.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.83.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.84.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.84.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.84.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.84.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.84.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.84.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.85.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.85.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.85.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.85.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.85.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.85.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.86.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.86.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.86.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.86.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.86.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.86.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.87.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.87.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.87.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.87.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.87.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.87.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.88.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.88.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.88.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.88.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.88.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.88.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.89.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.89.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.89.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.89.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.89.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.89.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.9.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.9.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.9.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.9.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.9.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.9.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.90.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.90.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.90.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.90.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.90.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.90.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.91.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.91.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.91.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.91.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.91.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.91.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.92.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.92.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.92.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.92.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.92.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.92.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.93.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.93.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.93.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.93.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.93.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.93.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.94.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.94.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.94.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.94.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.94.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.94.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.95.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.95.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.95.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.95.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.95.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.95.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.96.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.96.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.96.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.96.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.96.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.96.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.97.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.97.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.97.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.97.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.97.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.97.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.98.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.98.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.98.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.98.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.98.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.98.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.99.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.99.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.99.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.99.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.99.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.experts.99.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.gate.e_score_correction_bias": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.gate.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.shared_experts.down_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.shared_experts.down_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.shared_experts.gate_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.shared_experts.gate_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.shared_experts.up_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.mlp.shared_experts.up_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.post_attention_layernorm.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.self_attn.k_norm.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.self_attn.k_proj.bias": "model-00073-of-00092.safetensors",
+ "model.layers.72.self_attn.k_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.self_attn.k_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.self_attn.o_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.self_attn.o_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.self_attn.q_norm.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.self_attn.q_proj.bias": "model-00073-of-00092.safetensors",
+ "model.layers.72.self_attn.q_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.self_attn.q_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.72.self_attn.v_proj.bias": "model-00073-of-00092.safetensors",
+ "model.layers.72.self_attn.v_proj.weight": "model-00073-of-00092.safetensors",
+ "model.layers.72.self_attn.v_proj.weight_scale": "model-00073-of-00092.safetensors",
+ "model.layers.73.input_layernorm.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.0.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.0.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.0.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.0.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.0.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.0.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.1.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.1.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.1.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.1.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.1.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.1.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.10.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.10.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.10.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.10.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.10.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.10.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.100.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.100.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.100.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.100.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.100.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.100.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.101.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.101.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.101.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.101.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.101.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.101.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.102.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.102.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.102.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.102.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.102.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.102.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.103.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.103.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.103.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.103.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.103.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.103.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.104.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.104.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.104.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.104.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.104.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.104.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.105.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.105.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.105.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.105.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.105.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.105.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.106.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.106.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.106.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.106.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.106.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.106.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.107.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.107.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.107.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.107.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.107.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.107.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.108.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.108.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.108.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.108.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.108.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.108.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.109.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.109.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.109.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.109.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.109.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.109.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.11.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.11.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.11.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.11.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.11.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.11.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.110.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.110.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.110.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.110.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.110.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.110.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.111.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.111.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.111.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.111.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.111.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.111.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.112.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.112.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.112.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.112.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.112.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.112.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.113.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.113.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.113.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.113.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.113.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.113.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.114.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.114.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.114.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.114.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.114.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.114.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.115.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.115.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.115.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.115.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.115.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.115.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.116.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.116.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.116.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.116.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.116.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.116.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.117.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.117.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.117.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.117.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.117.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.117.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.118.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.118.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.118.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.118.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.118.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.118.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.119.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.119.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.119.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.119.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.119.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.119.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.12.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.12.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.12.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.12.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.12.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.12.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.120.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.120.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.120.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.120.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.120.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.120.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.121.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.121.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.121.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.121.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.121.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.121.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.122.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.122.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.122.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.122.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.122.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.122.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.123.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.123.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.123.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.123.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.123.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.123.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.124.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.124.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.124.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.124.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.124.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.124.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.125.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.125.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.125.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.125.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.125.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.125.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.126.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.126.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.126.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.126.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.126.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.126.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.127.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.127.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.127.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.127.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.127.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.127.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.128.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.128.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.128.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.128.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.128.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.128.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.129.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.129.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.129.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.129.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.129.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.129.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.13.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.13.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.13.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.13.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.13.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.13.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.130.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.130.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.130.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.130.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.130.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.130.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.131.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.131.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.131.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.131.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.131.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.131.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.132.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.132.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.132.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.132.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.132.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.132.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.133.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.133.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.133.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.133.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.133.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.133.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.134.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.134.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.134.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.134.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.134.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.134.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.135.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.135.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.135.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.135.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.135.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.135.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.136.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.136.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.136.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.136.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.136.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.136.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.137.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.137.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.137.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.137.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.137.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.137.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.138.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.138.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.138.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.138.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.138.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.138.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.139.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.139.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.139.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.139.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.139.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.139.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.14.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.14.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.14.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.14.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.14.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.14.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.140.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.140.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.140.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.140.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.140.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.140.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.141.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.141.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.141.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.141.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.141.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.141.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.142.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.142.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.142.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.142.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.142.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.142.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.143.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.143.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.143.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.143.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.143.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.143.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.144.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.144.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.144.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.144.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.144.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.144.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.145.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.145.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.145.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.145.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.145.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.145.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.146.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.146.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.146.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.146.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.146.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.146.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.147.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.147.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.147.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.147.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.147.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.147.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.148.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.148.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.148.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.148.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.148.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.148.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.149.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.149.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.149.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.149.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.149.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.149.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.15.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.15.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.15.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.15.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.15.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.15.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.150.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.150.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.150.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.150.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.150.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.150.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.151.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.151.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.151.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.151.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.151.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.151.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.152.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.152.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.152.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.152.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.152.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.152.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.153.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.153.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.153.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.153.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.153.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.153.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.154.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.154.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.154.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.154.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.154.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.154.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.155.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.155.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.155.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.155.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.155.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.155.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.156.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.156.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.156.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.156.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.156.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.156.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.157.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.157.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.157.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.157.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.157.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.157.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.158.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.158.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.158.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.158.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.158.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.158.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.159.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.159.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.159.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.159.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.159.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.159.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.16.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.16.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.16.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.16.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.16.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.16.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.17.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.17.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.17.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.17.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.17.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.17.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.18.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.18.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.18.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.18.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.18.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.18.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.19.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.19.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.19.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.19.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.19.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.19.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.2.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.2.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.2.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.2.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.2.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.2.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.20.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.20.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.20.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.20.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.20.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.20.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.21.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.21.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.21.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.21.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.21.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.21.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.22.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.22.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.22.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.22.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.22.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.22.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.23.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.23.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.23.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.23.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.23.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.23.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.24.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.24.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.24.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.24.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.24.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.24.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.25.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.25.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.25.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.25.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.25.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.25.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.26.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.26.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.26.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.26.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.26.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.26.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.27.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.27.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.27.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.27.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.27.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.27.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.28.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.28.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.28.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.28.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.28.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.28.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.29.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.29.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.29.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.29.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.29.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.29.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.3.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.3.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.3.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.3.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.3.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.3.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.30.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.30.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.30.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.30.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.30.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.30.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.31.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.31.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.31.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.31.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.31.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.31.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.32.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.32.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.32.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.32.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.32.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.32.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.33.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.33.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.33.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.33.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.33.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.33.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.34.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.34.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.34.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.34.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.34.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.34.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.35.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.35.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.35.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.35.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.35.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.35.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.36.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.36.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.36.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.36.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.36.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.36.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.37.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.37.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.37.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.37.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.37.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.37.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.38.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.38.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.38.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.38.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.38.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.38.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.39.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.39.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.39.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.39.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.39.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.39.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.4.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.4.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.4.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.4.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.4.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.4.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.40.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.40.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.40.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.40.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.40.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.40.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.41.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.41.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.41.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.41.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.41.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.41.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.42.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.42.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.42.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.42.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.42.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.42.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.43.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.43.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.43.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.43.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.43.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.43.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.44.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.44.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.44.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.44.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.44.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.44.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.45.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.45.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.45.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.45.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.45.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.45.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.46.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.46.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.46.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.46.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.46.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.46.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.47.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.47.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.47.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.47.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.47.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.47.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.48.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.48.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.48.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.48.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.48.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.48.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.49.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.49.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.49.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.49.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.49.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.49.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.5.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.5.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.5.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.5.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.5.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.5.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.50.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.50.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.50.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.50.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.50.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.50.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.51.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.51.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.51.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.51.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.51.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.51.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.52.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.52.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.52.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.52.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.52.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.52.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.53.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.53.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.53.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.53.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.53.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.53.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.54.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.54.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.54.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.54.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.54.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.54.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.55.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.55.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.55.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.55.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.55.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.55.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.56.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.56.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.56.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.56.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.56.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.56.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.57.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.57.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.57.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.57.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.57.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.57.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.58.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.58.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.58.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.58.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.58.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.58.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.59.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.59.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.59.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.59.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.59.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.59.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.6.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.6.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.6.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.6.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.6.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.6.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.60.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.60.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.60.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.60.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.60.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.60.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.61.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.61.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.61.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.61.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.61.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.61.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.62.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.62.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.62.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.62.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.62.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.62.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.63.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.63.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.63.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.63.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.63.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.63.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.64.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.64.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.64.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.64.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.64.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.64.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.65.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.65.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.65.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.65.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.65.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.65.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.66.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.66.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.66.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.66.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.66.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.66.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.67.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.67.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.67.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.67.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.67.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.67.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.68.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.68.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.68.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.68.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.68.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.68.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.69.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.69.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.69.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.69.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.69.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.69.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.7.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.7.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.7.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.7.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.7.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.7.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.70.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.70.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.70.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.70.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.70.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.70.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.71.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.71.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.71.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.71.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.71.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.71.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.72.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.72.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.72.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.72.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.72.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.72.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.73.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.73.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.73.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.73.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.73.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.73.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.74.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.74.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.74.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.74.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.74.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.74.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.75.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.75.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.75.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.75.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.75.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.75.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.76.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.76.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.76.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.76.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.76.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.76.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.77.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.77.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.77.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.77.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.77.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.77.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.78.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.78.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.78.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.78.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.78.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.78.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.79.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.79.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.79.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.79.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.79.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.79.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.8.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.8.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.8.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.8.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.8.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.8.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.80.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.80.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.80.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.80.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.80.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.80.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.81.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.81.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.81.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.81.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.81.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.81.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.82.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.82.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.82.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.82.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.82.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.82.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.83.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.83.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.83.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.83.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.83.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.83.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.84.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.84.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.84.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.84.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.84.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.84.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.85.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.85.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.85.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.85.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.85.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.85.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.86.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.86.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.86.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.86.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.86.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.86.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.87.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.87.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.87.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.87.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.87.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.87.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.88.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.88.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.88.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.88.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.88.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.88.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.89.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.89.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.89.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.89.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.89.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.89.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.9.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.9.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.9.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.9.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.9.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.9.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.90.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.90.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.90.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.90.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.90.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.90.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.91.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.91.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.91.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.91.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.91.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.91.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.92.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.92.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.92.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.92.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.92.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.92.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.93.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.93.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.93.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.93.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.93.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.93.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.94.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.94.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.94.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.94.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.94.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.94.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.95.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.95.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.95.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.95.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.95.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.95.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.96.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.96.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.96.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.96.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.96.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.96.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.97.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.97.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.97.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.97.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.97.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.97.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.98.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.98.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.98.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.98.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.98.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.98.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.99.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.99.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.99.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.99.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.99.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.experts.99.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.gate.e_score_correction_bias": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.gate.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.shared_experts.down_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.shared_experts.down_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.shared_experts.gate_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.shared_experts.gate_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.shared_experts.up_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.mlp.shared_experts.up_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.post_attention_layernorm.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.self_attn.k_norm.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.self_attn.k_proj.bias": "model-00074-of-00092.safetensors",
+ "model.layers.73.self_attn.k_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.self_attn.k_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.self_attn.o_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.self_attn.o_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.self_attn.q_norm.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.self_attn.q_proj.bias": "model-00074-of-00092.safetensors",
+ "model.layers.73.self_attn.q_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.self_attn.q_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.73.self_attn.v_proj.bias": "model-00074-of-00092.safetensors",
+ "model.layers.73.self_attn.v_proj.weight": "model-00074-of-00092.safetensors",
+ "model.layers.73.self_attn.v_proj.weight_scale": "model-00074-of-00092.safetensors",
+ "model.layers.74.input_layernorm.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.0.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.0.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.0.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.0.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.0.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.0.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.1.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.1.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.1.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.1.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.1.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.1.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.10.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.10.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.10.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.10.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.10.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.10.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.100.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.100.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.100.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.100.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.100.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.100.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.101.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.101.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.101.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.101.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.101.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.101.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.102.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.102.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.102.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.102.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.102.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.102.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.103.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.103.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.103.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.103.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.103.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.103.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.104.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.104.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.104.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.104.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.104.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.104.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.105.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.105.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.105.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.105.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.105.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.105.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.106.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.106.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.106.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.106.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.106.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.106.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.107.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.107.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.107.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.107.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.107.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.107.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.108.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.108.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.108.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.108.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.108.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.108.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.109.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.109.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.109.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.109.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.109.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.109.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.11.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.11.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.11.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.11.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.11.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.11.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.110.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.110.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.110.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.110.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.110.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.110.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.111.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.111.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.111.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.111.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.111.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.111.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.112.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.112.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.112.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.112.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.112.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.112.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.113.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.113.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.113.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.113.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.113.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.113.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.114.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.114.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.114.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.114.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.114.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.114.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.115.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.115.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.115.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.115.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.115.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.115.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.116.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.116.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.116.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.116.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.116.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.116.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.117.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.117.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.117.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.117.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.117.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.117.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.118.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.118.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.118.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.118.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.118.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.118.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.119.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.119.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.119.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.119.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.119.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.119.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.12.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.12.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.12.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.12.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.12.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.12.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.120.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.120.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.120.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.120.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.120.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.120.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.121.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.121.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.121.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.121.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.121.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.121.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.122.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.122.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.122.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.122.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.122.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.122.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.123.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.123.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.123.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.123.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.123.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.123.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.124.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.124.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.124.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.124.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.124.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.124.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.125.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.125.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.125.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.125.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.125.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.125.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.126.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.126.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.126.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.126.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.126.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.126.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.127.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.127.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.127.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.127.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.127.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.127.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.128.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.128.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.128.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.128.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.128.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.128.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.129.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.129.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.129.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.129.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.129.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.129.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.13.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.13.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.13.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.13.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.13.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.13.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.130.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.130.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.130.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.130.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.130.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.130.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.131.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.131.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.131.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.131.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.131.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.131.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.132.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.132.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.132.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.132.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.132.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.132.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.133.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.133.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.133.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.133.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.133.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.133.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.134.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.134.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.134.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.134.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.134.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.134.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.135.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.135.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.135.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.135.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.135.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.135.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.136.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.136.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.136.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.136.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.136.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.136.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.137.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.137.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.137.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.137.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.137.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.137.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.138.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.138.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.138.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.138.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.138.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.138.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.139.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.139.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.139.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.139.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.139.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.139.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.14.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.14.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.14.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.14.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.14.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.14.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.140.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.140.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.140.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.140.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.140.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.140.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.141.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.141.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.141.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.141.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.141.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.141.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.142.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.142.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.142.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.142.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.142.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.142.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.143.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.143.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.143.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.143.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.143.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.143.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.144.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.144.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.144.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.144.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.144.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.144.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.145.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.145.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.145.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.145.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.145.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.145.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.146.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.146.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.146.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.146.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.146.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.146.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.147.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.147.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.147.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.147.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.147.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.147.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.148.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.148.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.148.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.148.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.148.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.148.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.149.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.149.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.149.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.149.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.149.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.149.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.15.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.15.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.15.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.15.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.15.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.15.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.150.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.150.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.150.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.150.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.150.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.150.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.151.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.151.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.151.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.151.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.151.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.151.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.152.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.152.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.152.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.152.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.152.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.152.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.153.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.153.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.153.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.153.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.153.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.153.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.154.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.154.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.154.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.154.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.154.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.154.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.155.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.155.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.155.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.155.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.155.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.155.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.156.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.156.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.156.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.156.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.156.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.156.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.157.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.157.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.157.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.157.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.157.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.157.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.158.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.158.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.158.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.158.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.158.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.158.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.159.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.159.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.159.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.159.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.159.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.159.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.16.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.16.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.16.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.16.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.16.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.16.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.17.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.17.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.17.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.17.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.17.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.17.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.18.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.18.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.18.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.18.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.18.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.18.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.19.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.19.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.19.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.19.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.19.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.19.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.2.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.2.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.2.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.2.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.2.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.2.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.20.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.20.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.20.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.20.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.20.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.20.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.21.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.21.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.21.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.21.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.21.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.21.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.22.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.22.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.22.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.22.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.22.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.22.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.23.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.23.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.23.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.23.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.23.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.23.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.24.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.24.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.24.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.24.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.24.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.24.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.25.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.25.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.25.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.25.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.25.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.25.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.26.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.26.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.26.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.26.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.26.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.26.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.27.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.27.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.27.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.27.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.27.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.27.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.28.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.28.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.28.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.28.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.28.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.28.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.29.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.29.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.29.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.29.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.29.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.29.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.3.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.3.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.3.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.3.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.3.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.3.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.30.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.30.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.30.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.30.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.30.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.30.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.31.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.31.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.31.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.31.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.31.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.31.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.32.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.32.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.32.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.32.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.32.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.32.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.33.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.33.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.33.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.33.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.33.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.33.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.34.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.34.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.34.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.34.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.34.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.34.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.35.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.35.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.35.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.35.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.35.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.35.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.36.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.36.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.36.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.36.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.36.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.36.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.37.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.37.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.37.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.37.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.37.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.37.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.38.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.38.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.38.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.38.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.38.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.38.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.39.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.39.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.39.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.39.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.39.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.39.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.4.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.4.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.4.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.4.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.4.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.4.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.40.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.40.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.40.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.40.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.40.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.40.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.41.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.41.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.41.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.41.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.41.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.41.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.42.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.42.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.42.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.42.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.42.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.42.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.43.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.43.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.43.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.43.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.43.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.43.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.44.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.44.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.44.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.44.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.44.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.44.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.45.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.45.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.45.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.45.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.45.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.45.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.46.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.46.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.46.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.46.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.46.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.46.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.47.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.47.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.47.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.47.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.47.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.47.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.48.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.48.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.48.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.48.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.48.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.48.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.49.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.49.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.49.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.49.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.49.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.49.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.5.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.5.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.5.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.5.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.5.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.5.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.50.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.50.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.50.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.50.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.50.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.50.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.51.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.51.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.51.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.51.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.51.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.51.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.52.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.52.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.52.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.52.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.52.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.52.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.53.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.53.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.53.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.53.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.53.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.53.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.54.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.54.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.54.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.54.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.54.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.54.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.55.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.55.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.55.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.55.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.55.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.55.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.56.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.56.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.56.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.56.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.56.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.56.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.57.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.57.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.57.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.57.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.57.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.57.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.58.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.58.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.58.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.58.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.58.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.58.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.59.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.59.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.59.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.59.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.59.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.59.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.6.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.6.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.6.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.6.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.6.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.6.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.60.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.60.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.60.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.60.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.60.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.60.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.61.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.61.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.61.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.61.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.61.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.61.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.62.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.62.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.62.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.62.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.62.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.62.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.63.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.63.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.63.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.63.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.63.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.63.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.64.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.64.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.64.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.64.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.64.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.64.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.65.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.65.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.65.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.65.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.65.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.65.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.66.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.66.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.66.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.66.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.66.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.66.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.67.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.67.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.67.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.67.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.67.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.67.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.68.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.68.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.68.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.68.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.68.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.68.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.69.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.69.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.69.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.69.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.69.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.69.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.7.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.7.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.7.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.7.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.7.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.7.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.70.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.70.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.70.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.70.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.70.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.70.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.71.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.71.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.71.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.71.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.71.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.71.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.72.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.72.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.72.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.72.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.72.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.72.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.73.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.73.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.73.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.73.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.73.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.73.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.74.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.74.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.74.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.74.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.74.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.74.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.75.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.75.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.75.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.75.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.75.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.75.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.76.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.76.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.76.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.76.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.76.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.76.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.77.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.77.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.77.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.77.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.77.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.77.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.78.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.78.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.78.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.78.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.78.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.78.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.79.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.79.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.79.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.79.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.79.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.79.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.8.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.8.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.8.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.8.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.8.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.8.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.80.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.80.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.80.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.80.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.80.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.80.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.81.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.81.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.81.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.81.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.81.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.81.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.82.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.82.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.82.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.82.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.82.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.82.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.83.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.83.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.83.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.83.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.83.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.83.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.84.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.84.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.84.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.84.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.84.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.84.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.85.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.85.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.85.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.85.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.85.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.85.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.86.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.86.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.86.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.86.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.86.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.86.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.87.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.87.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.87.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.87.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.87.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.87.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.88.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.88.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.88.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.88.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.88.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.88.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.89.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.89.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.89.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.89.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.89.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.89.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.9.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.9.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.9.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.9.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.9.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.9.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.90.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.90.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.90.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.90.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.90.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.90.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.91.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.91.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.91.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.91.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.91.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.91.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.92.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.92.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.92.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.92.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.92.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.92.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.93.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.93.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.93.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.93.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.93.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.93.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.94.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.94.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.94.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.94.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.94.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.94.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.95.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.95.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.95.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.95.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.95.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.95.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.96.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.96.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.96.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.96.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.96.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.96.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.97.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.97.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.97.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.97.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.97.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.97.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.98.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.98.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.98.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.98.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.98.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.98.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.99.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.99.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.99.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.99.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.99.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.experts.99.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.gate.e_score_correction_bias": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.gate.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.shared_experts.down_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.shared_experts.down_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.shared_experts.gate_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.shared_experts.gate_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.shared_experts.up_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.mlp.shared_experts.up_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.post_attention_layernorm.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.self_attn.k_norm.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.self_attn.k_proj.bias": "model-00075-of-00092.safetensors",
+ "model.layers.74.self_attn.k_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.self_attn.k_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.self_attn.o_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.self_attn.o_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.self_attn.q_norm.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.self_attn.q_proj.bias": "model-00075-of-00092.safetensors",
+ "model.layers.74.self_attn.q_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.self_attn.q_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.74.self_attn.v_proj.bias": "model-00075-of-00092.safetensors",
+ "model.layers.74.self_attn.v_proj.weight": "model-00075-of-00092.safetensors",
+ "model.layers.74.self_attn.v_proj.weight_scale": "model-00075-of-00092.safetensors",
+ "model.layers.75.input_layernorm.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.0.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.0.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.0.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.0.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.0.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.0.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.1.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.1.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.1.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.1.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.1.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.1.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.10.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.10.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.10.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.10.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.10.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.10.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.100.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.100.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.100.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.100.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.100.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.100.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.101.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.101.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.101.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.101.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.101.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.101.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.102.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.102.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.102.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.102.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.102.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.102.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.103.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.103.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.103.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.103.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.103.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.103.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.104.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.104.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.104.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.104.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.104.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.104.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.105.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.105.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.105.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.105.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.105.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.105.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.106.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.106.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.106.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.106.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.106.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.106.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.107.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.107.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.107.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.107.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.107.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.107.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.108.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.108.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.108.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.108.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.108.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.108.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.109.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.109.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.109.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.109.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.109.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.109.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.11.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.11.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.11.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.11.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.11.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.11.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.110.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.110.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.110.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.110.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.110.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.110.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.111.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.111.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.111.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.111.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.111.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.111.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.112.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.112.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.112.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.112.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.112.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.112.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.113.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.113.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.113.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.113.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.113.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.113.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.114.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.114.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.114.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.114.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.114.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.114.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.115.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.115.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.115.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.115.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.115.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.115.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.116.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.116.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.116.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.116.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.116.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.116.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.117.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.117.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.117.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.117.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.117.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.117.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.118.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.118.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.118.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.118.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.118.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.118.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.119.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.119.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.119.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.119.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.119.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.119.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.12.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.12.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.12.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.12.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.12.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.12.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.120.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.120.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.120.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.120.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.120.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.120.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.121.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.121.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.121.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.121.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.121.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.121.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.122.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.122.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.122.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.122.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.122.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.122.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.123.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.123.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.123.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.123.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.123.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.123.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.124.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.124.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.124.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.124.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.124.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.124.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.125.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.125.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.125.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.125.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.125.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.125.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.126.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.126.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.126.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.126.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.126.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.126.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.127.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.127.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.127.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.127.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.127.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.127.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.128.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.128.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.128.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.128.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.128.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.128.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.129.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.129.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.129.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.129.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.129.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.129.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.13.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.13.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.13.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.13.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.13.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.13.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.130.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.130.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.130.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.130.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.130.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.130.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.131.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.131.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.131.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.131.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.131.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.131.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.132.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.132.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.132.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.132.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.132.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.132.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.133.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.133.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.133.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.133.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.133.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.133.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.134.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.134.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.134.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.134.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.134.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.134.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.135.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.135.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.135.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.135.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.135.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.135.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.136.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.136.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.136.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.136.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.136.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.136.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.137.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.137.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.137.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.137.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.137.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.137.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.138.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.138.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.138.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.138.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.138.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.138.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.139.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.139.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.139.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.139.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.139.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.139.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.14.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.14.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.14.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.14.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.14.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.14.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.140.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.140.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.140.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.140.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.140.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.140.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.141.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.141.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.141.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.141.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.141.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.141.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.142.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.142.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.142.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.142.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.142.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.142.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.143.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.143.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.143.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.143.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.143.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.143.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.144.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.144.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.144.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.144.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.144.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.144.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.145.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.145.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.145.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.145.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.145.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.145.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.146.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.146.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.146.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.146.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.146.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.146.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.147.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.147.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.147.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.147.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.147.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.147.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.148.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.148.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.148.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.148.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.148.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.148.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.149.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.149.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.149.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.149.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.149.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.149.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.15.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.15.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.15.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.15.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.15.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.15.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.150.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.150.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.150.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.150.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.150.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.150.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.151.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.151.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.151.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.151.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.151.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.151.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.152.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.152.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.152.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.152.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.152.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.152.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.153.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.153.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.153.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.153.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.153.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.153.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.154.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.154.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.154.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.154.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.154.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.154.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.155.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.155.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.155.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.155.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.155.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.155.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.156.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.156.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.156.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.156.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.156.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.156.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.157.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.157.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.157.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.157.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.157.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.157.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.158.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.158.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.158.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.158.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.158.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.158.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.159.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.159.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.159.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.159.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.159.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.159.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.16.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.16.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.16.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.16.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.16.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.16.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.17.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.17.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.17.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.17.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.17.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.17.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.18.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.18.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.18.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.18.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.18.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.18.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.19.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.19.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.19.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.19.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.19.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.19.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.2.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.2.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.2.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.2.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.2.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.2.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.20.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.20.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.20.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.20.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.20.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.20.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.21.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.21.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.21.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.21.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.21.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.21.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.22.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.22.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.22.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.22.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.22.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.22.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.23.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.23.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.23.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.23.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.23.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.23.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.24.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.24.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.24.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.24.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.24.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.24.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.25.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.25.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.25.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.25.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.25.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.25.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.26.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.26.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.26.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.26.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.26.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.26.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.27.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.27.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.27.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.27.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.27.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.27.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.28.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.28.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.28.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.28.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.28.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.28.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.29.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.29.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.29.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.29.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.29.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.29.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.3.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.3.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.3.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.3.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.3.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.3.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.30.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.30.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.30.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.30.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.30.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.30.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.31.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.31.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.31.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.31.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.31.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.31.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.32.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.32.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.32.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.32.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.32.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.32.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.33.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.33.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.33.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.33.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.33.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.33.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.34.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.34.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.34.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.34.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.34.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.34.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.35.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.35.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.35.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.35.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.35.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.35.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.36.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.36.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.36.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.36.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.36.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.36.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.37.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.37.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.37.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.37.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.37.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.37.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.38.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.38.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.38.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.38.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.38.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.38.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.39.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.39.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.39.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.39.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.39.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.39.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.4.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.4.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.4.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.4.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.4.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.4.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.40.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.40.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.40.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.40.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.40.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.40.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.41.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.41.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.41.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.41.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.41.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.41.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.42.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.42.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.42.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.42.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.42.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.42.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.43.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.43.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.43.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.43.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.43.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.43.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.44.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.44.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.44.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.44.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.44.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.44.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.45.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.45.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.45.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.45.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.45.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.45.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.46.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.46.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.46.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.46.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.46.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.46.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.47.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.47.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.47.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.47.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.47.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.47.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.48.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.48.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.48.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.48.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.48.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.48.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.49.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.49.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.49.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.49.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.49.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.49.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.5.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.5.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.5.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.5.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.5.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.5.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.50.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.50.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.50.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.50.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.50.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.50.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.51.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.51.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.51.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.51.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.51.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.51.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.52.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.52.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.52.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.52.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.52.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.52.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.53.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.53.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.53.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.53.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.53.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.53.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.54.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.54.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.54.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.54.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.54.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.54.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.55.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.55.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.55.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.55.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.55.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.55.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.56.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.56.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.56.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.56.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.56.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.56.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.57.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.57.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.57.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.57.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.57.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.57.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.58.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.58.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.58.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.58.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.58.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.58.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.59.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.59.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.59.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.59.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.59.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.59.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.6.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.6.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.6.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.6.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.6.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.6.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.60.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.60.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.60.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.60.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.60.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.60.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.61.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.61.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.61.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.61.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.61.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.61.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.62.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.62.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.62.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.62.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.62.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.62.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.63.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.63.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.63.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.63.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.63.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.63.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.64.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.64.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.64.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.64.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.64.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.64.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.65.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.65.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.65.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.65.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.65.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.65.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.66.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.66.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.66.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.66.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.66.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.66.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.67.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.67.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.67.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.67.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.67.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.67.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.68.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.68.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.68.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.68.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.68.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.68.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.69.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.69.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.69.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.69.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.69.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.69.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.7.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.7.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.7.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.7.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.7.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.7.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.70.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.70.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.70.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.70.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.70.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.70.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.71.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.71.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.71.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.71.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.71.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.71.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.72.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.72.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.72.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.72.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.72.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.72.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.73.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.73.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.73.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.73.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.73.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.73.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.74.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.74.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.74.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.74.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.74.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.74.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.75.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.75.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.75.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.75.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.75.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.75.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.76.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.76.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.76.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.76.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.76.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.76.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.77.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.77.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.77.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.77.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.77.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.77.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.78.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.78.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.78.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.78.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.78.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.78.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.79.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.79.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.79.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.79.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.79.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.79.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.8.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.8.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.8.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.8.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.8.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.8.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.80.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.80.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.80.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.80.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.80.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.80.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.81.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.81.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.81.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.81.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.81.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.81.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.82.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.82.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.82.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.82.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.82.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.82.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.83.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.83.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.83.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.83.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.83.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.83.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.84.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.84.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.84.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.84.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.84.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.84.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.85.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.85.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.85.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.85.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.85.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.85.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.86.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.86.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.86.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.86.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.86.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.86.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.87.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.87.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.87.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.87.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.87.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.87.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.88.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.88.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.88.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.88.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.88.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.88.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.89.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.89.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.89.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.89.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.89.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.89.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.9.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.9.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.9.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.9.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.9.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.9.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.90.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.90.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.90.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.90.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.90.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.90.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.91.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.91.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.91.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.91.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.91.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.91.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.92.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.92.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.92.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.92.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.92.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.92.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.93.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.93.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.93.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.93.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.93.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.93.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.94.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.94.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.94.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.94.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.94.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.94.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.95.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.95.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.95.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.95.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.95.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.95.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.96.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.96.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.96.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.96.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.96.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.96.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.97.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.97.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.97.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.97.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.97.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.97.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.98.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.98.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.98.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.98.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.98.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.98.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.99.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.99.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.99.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.99.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.99.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.experts.99.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.gate.e_score_correction_bias": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.gate.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.shared_experts.down_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.shared_experts.down_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.shared_experts.gate_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.shared_experts.gate_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.shared_experts.up_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.mlp.shared_experts.up_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.post_attention_layernorm.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.self_attn.k_norm.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.self_attn.k_proj.bias": "model-00076-of-00092.safetensors",
+ "model.layers.75.self_attn.k_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.self_attn.k_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.self_attn.o_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.self_attn.o_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.self_attn.q_norm.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.self_attn.q_proj.bias": "model-00076-of-00092.safetensors",
+ "model.layers.75.self_attn.q_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.self_attn.q_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.75.self_attn.v_proj.bias": "model-00076-of-00092.safetensors",
+ "model.layers.75.self_attn.v_proj.weight": "model-00076-of-00092.safetensors",
+ "model.layers.75.self_attn.v_proj.weight_scale": "model-00076-of-00092.safetensors",
+ "model.layers.76.input_layernorm.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.0.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.0.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.0.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.0.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.0.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.0.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.1.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.1.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.1.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.1.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.1.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.1.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.10.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.10.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.10.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.10.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.10.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.10.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.100.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.100.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.100.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.100.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.100.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.100.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.101.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.101.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.101.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.101.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.101.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.101.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.102.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.102.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.102.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.102.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.102.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.102.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.103.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.103.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.103.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.103.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.103.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.103.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.104.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.104.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.104.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.104.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.104.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.104.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.105.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.105.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.105.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.105.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.105.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.105.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.106.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.106.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.106.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.106.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.106.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.106.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.107.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.107.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.107.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.107.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.107.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.107.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.108.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.108.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.108.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.108.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.108.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.108.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.109.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.109.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.109.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.109.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.109.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.109.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.11.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.11.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.11.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.11.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.11.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.11.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.110.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.110.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.110.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.110.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.110.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.110.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.111.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.111.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.111.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.111.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.111.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.111.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.112.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.112.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.112.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.112.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.112.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.112.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.113.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.113.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.113.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.113.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.113.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.113.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.114.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.114.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.114.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.114.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.114.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.114.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.115.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.115.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.115.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.115.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.115.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.115.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.116.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.116.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.116.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.116.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.116.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.116.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.117.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.117.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.117.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.117.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.117.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.117.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.118.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.118.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.118.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.118.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.118.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.118.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.119.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.119.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.119.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.119.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.119.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.119.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.12.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.12.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.12.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.12.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.12.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.12.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.120.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.120.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.120.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.120.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.120.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.120.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.121.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.121.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.121.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.121.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.121.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.121.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.122.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.122.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.122.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.122.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.122.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.122.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.123.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.123.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.123.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.123.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.123.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.123.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.124.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.124.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.124.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.124.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.124.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.124.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.125.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.125.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.125.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.125.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.125.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.125.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.126.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.126.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.126.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.126.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.126.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.126.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.127.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.127.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.127.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.127.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.127.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.127.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.128.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.128.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.128.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.128.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.128.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.128.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.129.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.129.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.129.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.129.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.129.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.129.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.13.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.13.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.13.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.13.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.13.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.13.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.130.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.130.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.130.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.130.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.130.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.130.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.131.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.131.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.131.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.131.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.131.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.131.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.132.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.132.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.132.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.132.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.132.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.132.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.133.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.133.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.133.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.133.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.133.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.133.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.134.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.134.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.134.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.134.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.134.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.134.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.135.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.135.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.135.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.135.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.135.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.135.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.136.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.136.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.136.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.136.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.136.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.136.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.137.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.137.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.137.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.137.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.137.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.137.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.138.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.138.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.138.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.138.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.138.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.138.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.139.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.139.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.139.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.139.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.139.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.139.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.14.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.14.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.14.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.14.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.14.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.14.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.140.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.140.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.140.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.140.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.140.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.140.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.141.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.141.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.141.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.141.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.141.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.141.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.142.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.142.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.142.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.142.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.142.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.142.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.143.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.143.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.143.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.143.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.143.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.143.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.144.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.144.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.144.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.144.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.144.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.144.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.145.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.145.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.145.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.145.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.145.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.145.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.146.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.146.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.146.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.146.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.146.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.146.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.147.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.147.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.147.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.147.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.147.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.147.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.148.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.148.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.148.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.148.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.148.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.148.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.149.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.149.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.149.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.149.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.149.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.149.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.15.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.15.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.15.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.15.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.15.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.15.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.150.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.150.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.150.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.150.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.150.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.150.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.151.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.151.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.151.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.151.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.151.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.151.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.152.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.152.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.152.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.152.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.152.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.152.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.153.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.153.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.153.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.153.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.153.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.153.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.154.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.154.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.154.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.154.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.154.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.154.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.155.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.155.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.155.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.155.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.155.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.155.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.156.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.156.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.156.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.156.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.156.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.156.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.157.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.157.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.157.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.157.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.157.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.157.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.158.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.158.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.158.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.158.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.158.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.158.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.159.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.159.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.159.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.159.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.159.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.159.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.16.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.16.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.16.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.16.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.16.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.16.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.17.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.17.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.17.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.17.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.17.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.17.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.18.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.18.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.18.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.18.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.18.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.18.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.19.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.19.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.19.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.19.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.19.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.19.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.2.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.2.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.2.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.2.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.2.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.2.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.20.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.20.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.20.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.20.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.20.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.20.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.21.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.21.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.21.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.21.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.21.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.21.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.22.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.22.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.22.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.22.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.22.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.22.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.23.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.23.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.23.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.23.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.23.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.23.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.24.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.24.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.24.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.24.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.24.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.24.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.25.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.25.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.25.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.25.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.25.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.25.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.26.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.26.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.26.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.26.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.26.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.26.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.27.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.27.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.27.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.27.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.27.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.27.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.28.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.28.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.28.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.28.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.28.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.28.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.29.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.29.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.29.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.29.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.29.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.29.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.3.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.3.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.3.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.3.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.3.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.3.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.30.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.30.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.30.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.30.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.30.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.30.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.31.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.31.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.31.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.31.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.31.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.31.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.32.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.32.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.32.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.32.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.32.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.32.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.33.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.33.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.33.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.33.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.33.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.33.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.34.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.34.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.34.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.34.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.34.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.34.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.35.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.35.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.35.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.35.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.35.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.35.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.36.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.36.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.36.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.36.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.36.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.36.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.37.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.37.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.37.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.37.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.37.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.37.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.38.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.38.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.38.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.38.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.38.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.38.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.39.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.39.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.39.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.39.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.39.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.39.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.4.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.4.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.4.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.4.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.4.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.4.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.40.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.40.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.40.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.40.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.40.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.40.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.41.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.41.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.41.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.41.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.41.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.41.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.42.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.42.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.42.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.42.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.42.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.42.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.43.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.43.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.43.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.43.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.43.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.43.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.44.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.44.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.44.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.44.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.44.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.44.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.45.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.45.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.45.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.45.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.45.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.45.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.46.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.46.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.46.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.46.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.46.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.46.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.47.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.47.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.47.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.47.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.47.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.47.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.48.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.48.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.48.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.48.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.48.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.48.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.49.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.49.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.49.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.49.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.49.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.49.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.5.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.5.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.5.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.5.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.5.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.5.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.50.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.50.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.50.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.50.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.50.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.50.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.51.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.51.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.51.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.51.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.51.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.51.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.52.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.52.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.52.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.52.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.52.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.52.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.53.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.53.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.53.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.53.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.53.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.53.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.54.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.54.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.54.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.54.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.54.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.54.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.55.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.55.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.55.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.55.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.55.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.55.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.56.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.56.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.56.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.56.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.56.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.56.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.57.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.57.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.57.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.57.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.57.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.57.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.58.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.58.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.58.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.58.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.58.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.58.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.59.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.59.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.59.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.59.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.59.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.59.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.6.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.6.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.6.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.6.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.6.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.6.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.60.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.60.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.60.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.60.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.60.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.60.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.61.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.61.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.61.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.61.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.61.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.61.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.62.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.62.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.62.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.62.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.62.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.62.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.63.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.63.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.63.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.63.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.63.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.63.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.64.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.64.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.64.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.64.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.64.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.64.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.65.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.65.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.65.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.65.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.65.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.65.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.66.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.66.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.66.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.66.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.66.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.66.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.67.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.67.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.67.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.67.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.67.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.67.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.68.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.68.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.68.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.68.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.68.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.68.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.69.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.69.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.69.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.69.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.69.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.69.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.7.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.7.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.7.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.7.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.7.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.7.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.70.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.70.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.70.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.70.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.70.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.70.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.71.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.71.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.71.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.71.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.71.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.71.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.72.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.72.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.72.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.72.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.72.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.72.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.73.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.73.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.73.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.73.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.73.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.73.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.74.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.74.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.74.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.74.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.74.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.74.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.75.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.75.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.75.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.75.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.75.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.75.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.76.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.76.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.76.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.76.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.76.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.76.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.77.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.77.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.77.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.77.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.77.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.77.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.78.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.78.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.78.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.78.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.78.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.78.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.79.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.79.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.79.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.79.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.79.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.79.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.8.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.8.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.8.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.8.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.8.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.8.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.80.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.80.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.80.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.80.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.80.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.80.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.81.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.81.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.81.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.81.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.81.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.81.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.82.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.82.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.82.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.82.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.82.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.82.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.83.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.83.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.83.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.83.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.83.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.83.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.84.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.84.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.84.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.84.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.84.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.84.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.85.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.85.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.85.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.85.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.85.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.85.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.86.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.86.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.86.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.86.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.86.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.86.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.87.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.87.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.87.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.87.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.87.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.87.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.88.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.88.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.88.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.88.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.88.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.88.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.89.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.89.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.89.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.89.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.89.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.89.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.9.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.9.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.9.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.9.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.9.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.9.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.90.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.90.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.90.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.90.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.90.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.90.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.91.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.91.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.91.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.91.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.91.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.91.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.92.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.92.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.92.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.92.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.92.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.92.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.93.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.93.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.93.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.93.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.93.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.93.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.94.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.94.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.94.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.94.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.94.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.94.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.95.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.95.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.95.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.95.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.95.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.95.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.96.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.96.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.96.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.96.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.96.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.96.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.97.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.97.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.97.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.97.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.97.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.97.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.98.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.98.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.98.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.98.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.98.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.98.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.99.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.99.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.99.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.99.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.99.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.experts.99.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.gate.e_score_correction_bias": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.gate.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.shared_experts.down_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.shared_experts.down_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.shared_experts.gate_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.shared_experts.gate_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.shared_experts.up_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.mlp.shared_experts.up_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.post_attention_layernorm.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.self_attn.k_norm.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.self_attn.k_proj.bias": "model-00077-of-00092.safetensors",
+ "model.layers.76.self_attn.k_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.self_attn.k_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.self_attn.o_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.self_attn.o_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.self_attn.q_norm.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.self_attn.q_proj.bias": "model-00077-of-00092.safetensors",
+ "model.layers.76.self_attn.q_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.self_attn.q_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.76.self_attn.v_proj.bias": "model-00077-of-00092.safetensors",
+ "model.layers.76.self_attn.v_proj.weight": "model-00077-of-00092.safetensors",
+ "model.layers.76.self_attn.v_proj.weight_scale": "model-00077-of-00092.safetensors",
+ "model.layers.77.input_layernorm.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.0.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.0.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.0.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.0.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.0.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.0.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.1.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.1.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.1.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.1.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.1.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.1.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.10.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.10.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.10.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.10.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.10.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.10.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.100.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.100.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.100.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.100.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.100.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.100.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.101.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.101.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.101.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.101.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.101.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.101.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.102.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.102.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.102.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.102.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.102.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.102.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.103.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.103.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.103.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.103.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.103.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.103.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.104.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.104.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.104.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.104.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.104.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.104.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.105.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.105.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.105.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.105.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.105.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.105.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.106.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.106.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.106.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.106.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.106.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.106.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.107.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.107.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.107.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.107.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.107.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.107.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.108.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.108.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.108.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.108.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.108.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.108.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.109.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.109.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.109.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.109.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.109.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.109.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.11.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.11.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.11.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.11.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.11.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.11.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.110.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.110.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.110.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.110.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.110.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.110.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.111.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.111.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.111.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.111.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.111.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.111.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.112.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.112.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.112.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.112.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.112.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.112.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.113.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.113.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.113.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.113.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.113.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.113.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.114.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.114.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.114.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.114.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.114.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.114.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.115.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.115.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.115.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.115.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.115.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.115.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.116.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.116.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.116.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.116.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.116.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.116.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.117.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.117.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.117.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.117.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.117.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.117.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.118.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.118.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.118.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.118.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.118.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.118.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.119.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.119.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.119.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.119.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.119.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.119.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.12.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.12.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.12.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.12.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.12.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.12.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.120.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.120.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.120.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.120.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.120.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.120.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.121.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.121.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.121.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.121.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.121.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.121.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.122.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.122.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.122.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.122.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.122.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.122.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.123.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.123.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.123.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.123.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.123.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.123.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.124.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.124.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.124.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.124.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.124.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.124.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.125.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.125.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.125.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.125.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.125.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.125.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.126.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.126.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.126.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.126.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.126.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.126.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.127.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.127.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.127.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.127.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.127.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.127.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.128.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.128.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.128.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.128.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.128.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.128.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.129.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.129.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.129.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.129.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.129.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.129.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.13.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.13.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.13.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.13.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.13.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.13.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.130.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.130.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.130.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.130.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.130.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.130.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.131.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.131.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.131.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.131.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.131.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.131.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.132.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.132.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.132.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.132.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.132.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.132.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.133.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.133.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.133.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.133.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.133.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.133.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.134.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.134.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.134.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.134.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.134.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.134.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.135.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.135.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.135.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.135.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.135.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.135.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.136.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.136.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.136.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.136.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.136.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.136.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.137.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.137.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.137.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.137.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.137.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.137.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.138.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.138.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.138.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.138.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.138.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.138.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.139.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.139.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.139.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.139.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.139.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.139.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.14.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.14.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.14.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.14.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.14.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.14.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.140.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.140.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.140.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.140.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.140.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.140.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.141.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.141.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.141.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.141.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.141.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.141.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.142.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.142.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.142.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.142.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.142.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.142.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.143.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.143.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.143.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.143.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.143.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.143.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.144.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.144.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.144.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.144.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.144.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.144.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.145.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.145.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.145.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.145.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.145.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.145.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.146.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.146.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.146.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.146.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.146.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.146.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.147.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.147.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.147.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.147.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.147.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.147.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.148.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.148.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.148.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.148.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.148.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.148.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.149.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.149.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.149.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.149.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.149.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.149.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.15.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.15.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.15.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.15.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.15.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.15.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.150.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.150.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.150.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.150.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.150.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.150.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.151.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.151.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.151.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.151.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.151.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.151.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.152.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.152.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.152.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.152.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.152.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.152.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.153.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.153.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.153.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.153.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.153.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.153.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.154.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.154.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.154.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.154.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.154.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.154.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.155.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.155.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.155.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.155.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.155.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.155.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.156.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.156.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.156.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.156.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.156.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.156.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.157.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.157.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.157.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.157.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.157.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.157.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.158.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.158.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.158.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.158.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.158.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.158.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.159.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.159.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.159.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.159.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.159.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.159.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.16.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.16.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.16.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.16.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.16.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.16.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.17.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.17.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.17.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.17.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.17.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.17.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.18.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.18.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.18.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.18.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.18.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.18.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.19.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.19.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.19.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.19.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.19.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.19.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.2.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.2.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.2.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.2.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.2.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.2.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.20.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.20.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.20.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.20.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.20.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.20.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.21.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.21.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.21.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.21.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.21.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.21.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.22.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.22.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.22.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.22.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.22.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.22.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.23.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.23.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.23.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.23.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.23.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.23.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.24.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.24.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.24.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.24.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.24.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.24.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.25.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.25.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.25.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.25.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.25.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.25.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.26.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.26.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.26.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.26.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.26.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.26.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.27.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.27.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.27.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.27.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.27.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.27.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.28.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.28.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.28.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.28.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.28.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.28.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.29.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.29.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.29.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.29.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.29.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.29.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.3.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.3.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.3.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.3.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.3.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.3.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.30.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.30.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.30.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.30.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.30.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.30.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.31.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.31.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.31.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.31.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.31.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.31.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.32.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.32.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.32.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.32.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.32.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.32.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.33.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.33.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.33.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.33.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.33.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.33.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.34.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.34.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.34.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.34.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.34.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.34.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.35.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.35.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.35.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.35.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.35.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.35.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.36.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.36.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.36.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.36.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.36.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.36.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.37.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.37.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.37.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.37.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.37.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.37.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.38.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.38.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.38.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.38.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.38.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.38.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.39.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.39.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.39.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.39.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.39.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.39.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.4.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.4.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.4.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.4.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.4.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.4.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.40.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.40.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.40.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.40.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.40.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.40.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.41.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.41.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.41.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.41.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.41.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.41.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.42.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.42.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.42.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.42.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.42.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.42.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.43.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.43.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.43.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.43.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.43.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.43.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.44.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.44.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.44.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.44.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.44.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.44.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.45.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.45.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.45.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.45.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.45.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.45.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.46.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.46.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.46.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.46.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.46.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.46.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.47.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.47.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.47.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.47.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.47.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.47.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.48.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.48.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.48.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.48.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.48.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.48.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.49.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.49.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.49.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.49.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.49.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.49.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.5.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.5.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.5.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.5.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.5.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.5.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.50.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.50.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.50.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.50.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.50.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.50.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.51.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.51.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.51.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.51.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.51.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.51.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.52.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.52.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.52.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.52.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.52.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.52.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.53.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.53.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.53.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.53.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.53.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.53.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.54.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.54.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.54.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.54.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.54.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.54.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.55.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.55.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.55.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.55.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.55.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.55.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.56.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.56.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.56.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.56.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.56.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.56.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.57.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.57.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.57.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.57.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.57.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.57.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.58.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.58.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.58.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.58.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.58.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.58.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.59.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.59.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.59.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.59.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.59.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.59.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.6.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.6.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.6.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.6.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.6.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.6.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.60.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.60.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.60.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.60.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.60.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.60.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.61.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.61.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.61.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.61.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.61.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.61.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.62.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.62.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.62.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.62.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.62.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.62.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.63.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.63.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.63.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.63.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.63.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.63.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.64.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.64.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.64.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.64.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.64.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.64.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.65.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.65.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.65.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.65.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.65.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.65.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.66.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.66.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.66.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.66.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.66.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.66.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.67.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.67.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.67.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.67.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.67.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.67.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.68.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.68.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.68.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.68.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.68.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.68.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.69.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.69.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.69.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.69.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.69.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.69.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.7.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.7.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.7.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.7.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.7.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.7.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.70.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.70.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.70.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.70.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.70.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.70.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.71.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.71.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.71.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.71.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.71.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.71.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.72.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.72.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.72.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.72.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.72.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.72.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.73.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.73.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.73.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.73.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.73.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.73.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.74.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.74.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.74.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.74.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.74.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.74.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.75.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.75.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.75.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.75.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.75.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.75.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.76.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.76.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.76.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.76.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.76.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.76.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.77.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.77.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.77.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.77.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.77.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.77.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.78.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.78.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.78.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.78.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.78.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.78.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.79.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.79.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.79.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.79.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.79.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.79.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.8.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.8.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.8.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.8.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.8.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.8.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.80.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.80.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.80.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.80.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.80.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.80.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.81.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.81.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.81.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.81.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.81.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.81.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.82.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.82.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.82.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.82.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.82.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.82.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.83.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.83.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.83.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.83.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.83.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.83.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.84.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.84.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.84.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.84.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.84.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.84.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.85.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.85.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.85.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.85.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.85.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.85.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.86.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.86.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.86.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.86.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.86.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.86.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.87.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.87.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.87.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.87.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.87.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.87.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.88.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.88.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.88.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.88.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.88.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.88.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.89.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.89.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.89.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.89.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.89.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.89.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.9.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.9.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.9.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.9.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.9.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.9.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.90.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.90.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.90.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.90.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.90.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.90.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.91.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.91.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.91.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.91.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.91.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.91.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.92.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.92.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.92.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.92.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.92.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.92.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.93.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.93.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.93.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.93.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.93.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.93.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.94.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.94.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.94.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.94.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.94.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.94.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.95.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.95.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.95.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.95.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.95.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.95.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.96.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.96.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.96.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.96.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.96.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.96.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.97.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.97.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.97.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.97.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.97.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.97.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.98.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.98.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.98.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.98.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.98.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.98.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.99.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.99.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.99.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.99.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.99.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.experts.99.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.gate.e_score_correction_bias": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.gate.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.shared_experts.down_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.shared_experts.down_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.shared_experts.gate_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.shared_experts.gate_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.shared_experts.up_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.mlp.shared_experts.up_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.post_attention_layernorm.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.self_attn.k_norm.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.self_attn.k_proj.bias": "model-00078-of-00092.safetensors",
+ "model.layers.77.self_attn.k_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.self_attn.k_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.self_attn.o_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.self_attn.o_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.self_attn.q_norm.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.self_attn.q_proj.bias": "model-00078-of-00092.safetensors",
+ "model.layers.77.self_attn.q_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.self_attn.q_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.77.self_attn.v_proj.bias": "model-00078-of-00092.safetensors",
+ "model.layers.77.self_attn.v_proj.weight": "model-00078-of-00092.safetensors",
+ "model.layers.77.self_attn.v_proj.weight_scale": "model-00078-of-00092.safetensors",
+ "model.layers.78.input_layernorm.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.0.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.0.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.0.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.0.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.0.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.0.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.1.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.1.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.1.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.1.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.1.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.1.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.10.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.10.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.10.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.10.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.10.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.10.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.100.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.100.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.100.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.100.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.100.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.100.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.101.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.101.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.101.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.101.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.101.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.101.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.102.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.102.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.102.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.102.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.102.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.102.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.103.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.103.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.103.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.103.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.103.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.103.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.104.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.104.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.104.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.104.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.104.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.104.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.105.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.105.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.105.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.105.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.105.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.105.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.106.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.106.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.106.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.106.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.106.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.106.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.107.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.107.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.107.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.107.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.107.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.107.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.108.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.108.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.108.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.108.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.108.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.108.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.109.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.109.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.109.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.109.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.109.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.109.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.11.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.11.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.11.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.11.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.11.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.11.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.110.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.110.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.110.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.110.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.110.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.110.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.111.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.111.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.111.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.111.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.111.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.111.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.112.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.112.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.112.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.112.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.112.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.112.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.113.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.113.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.113.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.113.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.113.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.113.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.114.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.114.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.114.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.114.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.114.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.114.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.115.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.115.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.115.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.115.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.115.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.115.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.116.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.116.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.116.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.116.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.116.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.116.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.117.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.117.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.117.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.117.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.117.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.117.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.118.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.118.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.118.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.118.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.118.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.118.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.119.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.119.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.119.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.119.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.119.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.119.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.12.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.12.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.12.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.12.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.12.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.12.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.120.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.120.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.120.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.120.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.120.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.120.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.121.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.121.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.121.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.121.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.121.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.121.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.122.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.122.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.122.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.122.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.122.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.122.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.123.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.123.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.123.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.123.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.123.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.123.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.124.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.124.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.124.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.124.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.124.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.124.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.125.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.125.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.125.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.125.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.125.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.125.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.126.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.126.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.126.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.126.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.126.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.126.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.127.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.127.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.127.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.127.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.127.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.127.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.128.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.128.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.128.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.128.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.128.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.128.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.129.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.129.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.129.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.129.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.129.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.129.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.13.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.13.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.13.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.13.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.13.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.13.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.130.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.130.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.130.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.130.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.130.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.130.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.131.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.131.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.131.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.131.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.131.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.131.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.132.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.132.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.132.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.132.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.132.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.132.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.133.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.133.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.133.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.133.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.133.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.133.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.134.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.134.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.134.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.134.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.134.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.134.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.135.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.135.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.135.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.135.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.135.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.135.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.136.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.136.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.136.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.136.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.136.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.136.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.137.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.137.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.137.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.137.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.137.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.137.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.138.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.138.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.138.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.138.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.138.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.138.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.139.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.139.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.139.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.139.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.139.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.139.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.14.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.14.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.14.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.14.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.14.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.14.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.140.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.140.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.140.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.140.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.140.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.140.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.141.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.141.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.141.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.141.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.141.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.141.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.142.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.142.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.142.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.142.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.142.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.142.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.143.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.143.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.143.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.143.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.143.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.143.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.144.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.144.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.144.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.144.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.144.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.144.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.145.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.145.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.145.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.145.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.145.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.145.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.146.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.146.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.146.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.146.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.146.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.146.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.147.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.147.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.147.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.147.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.147.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.147.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.148.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.148.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.148.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.148.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.148.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.148.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.149.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.149.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.149.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.149.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.149.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.149.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.15.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.15.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.15.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.15.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.15.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.15.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.150.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.150.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.150.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.150.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.150.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.150.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.151.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.151.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.151.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.151.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.151.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.151.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.152.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.152.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.152.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.152.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.152.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.152.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.153.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.153.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.153.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.153.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.153.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.153.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.154.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.154.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.154.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.154.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.154.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.154.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.155.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.155.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.155.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.155.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.155.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.155.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.156.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.156.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.156.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.156.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.156.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.156.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.157.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.157.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.157.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.157.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.157.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.157.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.158.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.158.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.158.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.158.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.158.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.158.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.159.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.159.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.159.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.159.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.159.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.159.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.16.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.16.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.16.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.16.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.16.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.16.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.17.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.17.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.17.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.17.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.17.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.17.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.18.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.18.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.18.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.18.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.18.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.18.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.19.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.19.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.19.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.19.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.19.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.19.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.2.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.2.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.2.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.2.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.2.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.2.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.20.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.20.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.20.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.20.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.20.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.20.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.21.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.21.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.21.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.21.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.21.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.21.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.22.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.22.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.22.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.22.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.22.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.22.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.23.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.23.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.23.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.23.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.23.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.23.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.24.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.24.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.24.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.24.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.24.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.24.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.25.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.25.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.25.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.25.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.25.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.25.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.26.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.26.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.26.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.26.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.26.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.26.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.27.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.27.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.27.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.27.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.27.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.27.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.28.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.28.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.28.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.28.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.28.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.28.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.29.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.29.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.29.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.29.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.29.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.29.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.3.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.3.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.3.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.3.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.3.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.3.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.30.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.30.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.30.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.30.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.30.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.30.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.31.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.31.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.31.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.31.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.31.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.31.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.32.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.32.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.32.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.32.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.32.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.32.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.33.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.33.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.33.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.33.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.33.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.33.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.34.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.34.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.34.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.34.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.34.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.34.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.35.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.35.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.35.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.35.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.35.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.35.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.36.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.36.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.36.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.36.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.36.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.36.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.37.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.37.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.37.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.37.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.37.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.37.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.38.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.38.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.38.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.38.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.38.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.38.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.39.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.39.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.39.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.39.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.39.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.39.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.4.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.4.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.4.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.4.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.4.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.4.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.40.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.40.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.40.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.40.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.40.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.40.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.41.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.41.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.41.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.41.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.41.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.41.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.42.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.42.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.42.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.42.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.42.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.42.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.43.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.43.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.43.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.43.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.43.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.43.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.44.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.44.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.44.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.44.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.44.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.44.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.45.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.45.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.45.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.45.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.45.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.45.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.46.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.46.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.46.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.46.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.46.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.46.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.47.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.47.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.47.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.47.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.47.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.47.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.48.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.48.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.48.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.48.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.48.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.48.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.49.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.49.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.49.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.49.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.49.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.49.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.5.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.5.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.5.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.5.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.5.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.5.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.50.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.50.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.50.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.50.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.50.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.50.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.51.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.51.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.51.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.51.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.51.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.51.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.52.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.52.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.52.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.52.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.52.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.52.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.53.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.53.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.53.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.53.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.53.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.53.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.54.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.54.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.54.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.54.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.54.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.54.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.55.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.55.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.55.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.55.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.55.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.55.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.56.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.56.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.56.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.56.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.56.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.56.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.57.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.57.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.57.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.57.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.57.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.57.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.58.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.58.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.58.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.58.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.58.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.58.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.59.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.59.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.59.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.59.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.59.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.59.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.6.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.6.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.6.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.6.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.6.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.6.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.60.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.60.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.60.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.60.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.60.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.60.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.61.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.61.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.61.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.61.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.61.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.61.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.62.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.62.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.62.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.62.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.62.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.62.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.63.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.63.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.63.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.63.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.63.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.63.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.64.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.64.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.64.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.64.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.64.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.64.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.65.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.65.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.65.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.65.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.65.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.65.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.66.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.66.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.66.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.66.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.66.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.66.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.67.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.67.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.67.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.67.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.67.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.67.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.68.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.68.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.68.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.68.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.68.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.68.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.69.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.69.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.69.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.69.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.69.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.69.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.7.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.7.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.7.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.7.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.7.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.7.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.70.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.70.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.70.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.70.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.70.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.70.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.71.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.71.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.71.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.71.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.71.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.71.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.72.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.72.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.72.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.72.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.72.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.72.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.73.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.73.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.73.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.73.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.73.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.73.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.74.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.74.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.74.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.74.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.74.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.74.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.75.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.75.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.75.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.75.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.75.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.75.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.76.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.76.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.76.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.76.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.76.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.76.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.77.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.77.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.77.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.77.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.77.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.77.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.78.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.78.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.78.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.78.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.78.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.78.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.79.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.79.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.79.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.79.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.79.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.79.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.8.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.8.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.8.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.8.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.8.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.8.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.80.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.80.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.80.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.80.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.80.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.80.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.81.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.81.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.81.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.81.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.81.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.81.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.82.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.82.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.82.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.82.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.82.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.82.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.83.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.83.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.83.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.83.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.83.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.83.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.84.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.84.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.84.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.84.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.84.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.84.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.85.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.85.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.85.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.85.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.85.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.85.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.86.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.86.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.86.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.86.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.86.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.86.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.87.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.87.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.87.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.87.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.87.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.87.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.88.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.88.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.88.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.88.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.88.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.88.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.89.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.89.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.89.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.89.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.89.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.89.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.9.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.9.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.9.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.9.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.9.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.9.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.90.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.90.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.90.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.90.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.90.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.90.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.91.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.91.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.91.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.91.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.91.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.91.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.92.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.92.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.92.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.92.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.92.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.92.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.93.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.93.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.93.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.93.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.93.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.93.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.94.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.94.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.94.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.94.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.94.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.94.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.95.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.95.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.95.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.95.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.95.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.95.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.96.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.96.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.96.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.96.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.96.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.96.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.97.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.97.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.97.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.97.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.97.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.97.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.98.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.98.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.98.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.98.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.98.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.98.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.99.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.99.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.99.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.99.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.99.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.experts.99.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.gate.e_score_correction_bias": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.gate.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.shared_experts.down_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.shared_experts.down_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.shared_experts.gate_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.shared_experts.gate_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.shared_experts.up_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.mlp.shared_experts.up_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.post_attention_layernorm.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.self_attn.k_norm.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.self_attn.k_proj.bias": "model-00079-of-00092.safetensors",
+ "model.layers.78.self_attn.k_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.self_attn.k_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.self_attn.o_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.self_attn.o_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.self_attn.q_norm.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.self_attn.q_proj.bias": "model-00079-of-00092.safetensors",
+ "model.layers.78.self_attn.q_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.self_attn.q_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.78.self_attn.v_proj.bias": "model-00079-of-00092.safetensors",
+ "model.layers.78.self_attn.v_proj.weight": "model-00079-of-00092.safetensors",
+ "model.layers.78.self_attn.v_proj.weight_scale": "model-00079-of-00092.safetensors",
+ "model.layers.79.input_layernorm.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.0.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.0.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.0.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.0.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.0.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.0.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.1.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.1.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.1.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.1.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.1.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.1.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.10.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.10.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.10.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.10.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.10.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.10.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.100.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.100.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.100.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.100.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.100.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.100.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.101.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.101.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.101.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.101.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.101.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.101.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.102.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.102.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.102.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.102.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.102.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.102.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.103.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.103.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.103.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.103.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.103.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.103.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.104.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.104.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.104.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.104.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.104.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.104.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.105.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.105.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.105.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.105.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.105.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.105.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.106.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.106.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.106.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.106.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.106.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.106.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.107.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.107.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.107.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.107.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.107.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.107.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.108.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.108.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.108.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.108.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.108.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.108.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.109.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.109.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.109.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.109.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.109.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.109.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.11.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.11.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.11.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.11.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.11.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.11.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.110.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.110.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.110.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.110.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.110.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.110.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.111.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.111.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.111.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.111.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.111.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.111.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.112.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.112.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.112.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.112.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.112.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.112.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.113.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.113.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.113.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.113.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.113.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.113.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.114.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.114.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.114.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.114.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.114.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.114.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.115.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.115.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.115.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.115.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.115.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.115.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.116.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.116.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.116.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.116.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.116.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.116.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.117.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.117.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.117.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.117.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.117.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.117.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.118.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.118.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.118.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.118.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.118.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.118.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.119.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.119.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.119.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.119.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.119.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.119.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.12.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.12.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.12.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.12.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.12.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.12.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.120.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.120.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.120.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.120.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.120.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.120.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.121.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.121.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.121.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.121.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.121.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.121.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.122.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.122.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.122.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.122.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.122.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.122.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.123.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.123.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.123.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.123.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.123.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.123.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.124.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.124.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.124.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.124.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.124.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.124.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.125.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.125.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.125.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.125.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.125.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.125.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.126.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.126.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.126.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.126.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.126.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.126.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.127.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.127.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.127.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.127.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.127.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.127.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.128.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.128.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.128.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.128.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.128.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.128.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.129.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.129.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.129.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.129.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.129.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.129.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.13.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.13.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.13.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.13.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.13.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.13.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.130.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.130.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.130.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.130.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.130.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.130.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.131.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.131.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.131.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.131.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.131.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.131.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.132.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.132.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.132.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.132.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.132.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.132.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.133.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.133.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.133.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.133.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.133.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.133.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.134.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.134.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.134.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.134.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.134.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.134.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.135.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.135.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.135.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.135.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.135.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.135.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.136.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.136.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.136.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.136.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.136.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.136.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.137.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.137.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.137.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.137.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.137.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.137.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.138.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.138.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.138.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.138.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.138.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.138.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.139.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.139.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.139.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.139.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.139.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.139.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.14.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.14.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.14.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.14.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.14.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.14.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.140.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.140.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.140.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.140.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.140.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.140.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.141.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.141.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.141.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.141.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.141.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.141.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.142.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.142.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.142.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.142.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.142.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.142.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.143.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.143.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.143.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.143.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.143.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.143.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.144.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.144.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.144.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.144.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.144.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.144.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.145.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.145.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.145.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.145.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.145.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.145.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.146.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.146.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.146.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.146.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.146.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.146.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.147.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.147.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.147.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.147.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.147.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.147.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.148.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.148.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.148.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.148.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.148.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.148.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.149.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.149.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.149.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.149.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.149.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.149.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.15.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.15.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.15.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.15.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.15.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.15.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.150.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.150.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.150.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.150.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.150.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.150.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.151.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.151.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.151.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.151.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.151.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.151.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.152.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.152.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.152.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.152.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.152.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.152.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.153.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.153.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.153.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.153.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.153.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.153.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.154.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.154.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.154.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.154.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.154.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.154.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.155.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.155.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.155.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.155.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.155.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.155.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.156.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.156.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.156.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.156.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.156.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.156.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.157.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.157.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.157.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.157.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.157.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.157.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.158.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.158.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.158.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.158.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.158.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.158.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.159.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.159.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.159.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.159.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.159.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.159.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.16.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.16.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.16.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.16.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.16.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.16.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.17.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.17.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.17.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.17.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.17.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.17.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.18.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.18.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.18.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.18.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.18.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.18.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.19.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.19.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.19.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.19.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.19.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.19.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.2.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.2.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.2.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.2.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.2.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.2.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.20.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.20.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.20.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.20.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.20.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.20.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.21.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.21.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.21.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.21.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.21.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.21.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.22.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.22.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.22.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.22.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.22.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.22.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.23.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.23.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.23.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.23.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.23.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.23.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.24.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.24.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.24.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.24.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.24.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.24.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.25.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.25.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.25.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.25.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.25.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.25.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.26.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.26.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.26.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.26.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.26.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.26.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.27.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.27.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.27.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.27.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.27.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.27.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.28.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.28.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.28.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.28.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.28.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.28.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.29.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.29.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.29.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.29.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.29.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.29.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.3.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.3.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.3.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.3.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.3.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.3.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.30.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.30.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.30.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.30.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.30.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.30.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.31.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.31.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.31.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.31.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.31.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.31.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.32.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.32.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.32.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.32.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.32.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.32.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.33.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.33.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.33.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.33.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.33.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.33.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.34.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.34.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.34.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.34.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.34.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.34.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.35.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.35.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.35.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.35.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.35.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.35.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.36.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.36.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.36.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.36.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.36.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.36.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.37.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.37.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.37.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.37.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.37.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.37.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.38.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.38.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.38.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.38.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.38.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.38.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.39.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.39.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.39.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.39.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.39.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.39.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.4.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.4.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.4.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.4.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.4.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.4.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.40.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.40.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.40.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.40.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.40.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.40.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.41.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.41.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.41.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.41.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.41.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.41.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.42.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.42.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.42.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.42.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.42.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.42.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.43.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.43.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.43.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.43.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.43.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.43.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.44.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.44.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.44.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.44.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.44.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.44.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.45.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.45.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.45.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.45.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.45.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.45.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.46.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.46.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.46.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.46.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.46.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.46.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.47.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.47.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.47.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.47.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.47.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.47.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.48.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.48.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.48.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.48.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.48.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.48.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.49.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.49.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.49.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.49.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.49.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.49.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.5.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.5.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.5.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.5.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.5.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.5.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.50.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.50.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.50.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.50.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.50.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.50.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.51.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.51.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.51.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.51.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.51.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.51.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.52.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.52.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.52.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.52.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.52.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.52.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.53.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.53.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.53.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.53.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.53.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.53.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.54.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.54.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.54.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.54.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.54.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.54.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.55.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.55.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.55.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.55.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.55.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.55.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.56.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.56.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.56.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.56.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.56.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.56.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.57.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.57.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.57.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.57.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.57.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.57.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.58.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.58.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.58.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.58.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.58.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.58.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.59.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.59.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.59.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.59.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.59.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.59.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.6.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.6.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.6.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.6.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.6.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.6.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.60.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.60.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.60.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.60.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.60.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.60.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.61.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.61.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.61.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.61.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.61.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.61.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.62.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.62.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.62.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.62.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.62.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.62.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.63.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.63.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.63.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.63.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.63.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.63.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.64.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.64.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.64.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.64.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.64.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.64.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.65.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.65.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.65.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.65.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.65.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.65.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.66.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.66.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.66.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.66.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.66.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.66.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.67.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.67.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.67.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.67.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.67.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.67.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.68.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.68.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.68.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.68.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.68.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.68.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.69.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.69.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.69.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.69.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.69.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.69.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.7.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.7.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.7.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.7.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.7.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.7.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.70.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.70.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.70.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.70.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.70.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.70.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.71.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.71.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.71.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.71.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.71.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.71.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.72.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.72.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.72.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.72.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.72.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.72.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.73.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.73.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.73.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.73.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.73.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.73.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.74.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.74.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.74.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.74.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.74.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.74.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.75.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.75.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.75.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.75.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.75.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.75.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.76.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.76.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.76.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.76.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.76.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.76.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.77.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.77.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.77.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.77.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.77.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.77.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.78.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.78.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.78.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.78.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.78.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.78.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.79.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.79.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.79.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.79.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.79.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.79.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.8.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.8.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.8.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.8.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.8.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.8.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.80.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.80.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.80.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.80.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.80.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.80.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.81.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.81.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.81.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.81.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.81.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.81.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.82.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.82.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.82.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.82.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.82.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.82.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.83.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.83.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.83.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.83.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.83.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.83.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.84.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.84.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.84.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.84.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.84.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.84.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.85.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.85.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.85.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.85.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.85.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.85.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.86.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.86.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.86.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.86.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.86.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.86.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.87.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.87.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.87.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.87.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.87.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.87.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.88.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.88.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.88.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.88.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.88.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.88.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.89.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.89.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.89.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.89.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.89.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.89.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.9.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.9.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.9.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.9.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.9.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.9.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.90.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.90.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.90.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.90.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.90.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.90.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.91.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.91.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.91.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.91.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.91.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.91.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.92.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.92.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.92.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.92.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.92.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.92.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.93.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.93.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.93.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.93.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.93.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.93.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.94.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.94.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.94.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.94.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.94.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.94.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.95.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.95.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.95.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.95.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.95.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.95.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.96.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.96.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.96.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.96.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.96.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.96.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.97.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.97.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.97.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.97.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.97.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.97.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.98.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.98.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.98.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.98.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.98.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.98.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.99.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.99.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.99.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.99.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.99.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.experts.99.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.gate.e_score_correction_bias": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.gate.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.shared_experts.down_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.shared_experts.down_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.shared_experts.gate_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.shared_experts.gate_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.shared_experts.up_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.mlp.shared_experts.up_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.post_attention_layernorm.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.self_attn.k_norm.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.self_attn.k_proj.bias": "model-00080-of-00092.safetensors",
+ "model.layers.79.self_attn.k_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.self_attn.k_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.self_attn.o_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.self_attn.o_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.self_attn.q_norm.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.self_attn.q_proj.bias": "model-00080-of-00092.safetensors",
+ "model.layers.79.self_attn.q_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.self_attn.q_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.79.self_attn.v_proj.bias": "model-00080-of-00092.safetensors",
+ "model.layers.79.self_attn.v_proj.weight": "model-00080-of-00092.safetensors",
+ "model.layers.79.self_attn.v_proj.weight_scale": "model-00080-of-00092.safetensors",
+ "model.layers.8.input_layernorm.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.0.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.0.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.0.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.0.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.0.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.0.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.1.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.1.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.1.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.1.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.1.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.1.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.10.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.10.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.10.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.10.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.10.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.10.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.100.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.100.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.100.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.100.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.100.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.100.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.101.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.101.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.101.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.101.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.101.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.101.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.102.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.102.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.102.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.102.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.102.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.102.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.103.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.103.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.103.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.103.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.103.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.103.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.104.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.104.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.104.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.104.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.104.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.104.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.105.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.105.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.105.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.105.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.105.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.105.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.106.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.106.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.106.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.106.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.106.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.106.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.107.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.107.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.107.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.107.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.107.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.107.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.108.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.108.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.108.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.108.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.108.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.108.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.109.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.109.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.109.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.109.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.109.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.109.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.11.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.11.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.11.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.11.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.11.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.11.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.110.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.110.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.110.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.110.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.110.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.110.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.111.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.111.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.111.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.111.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.111.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.111.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.112.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.112.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.112.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.112.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.112.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.112.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.113.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.113.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.113.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.113.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.113.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.113.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.114.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.114.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.114.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.114.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.114.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.114.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.115.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.115.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.115.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.115.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.115.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.115.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.116.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.116.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.116.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.116.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.116.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.116.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.117.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.117.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.117.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.117.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.117.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.117.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.118.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.118.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.118.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.118.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.118.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.118.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.119.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.119.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.119.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.119.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.119.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.119.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.12.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.12.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.12.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.12.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.12.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.12.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.120.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.120.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.120.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.120.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.120.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.120.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.121.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.121.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.121.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.121.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.121.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.121.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.122.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.122.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.122.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.122.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.122.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.122.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.123.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.123.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.123.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.123.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.123.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.123.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.124.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.124.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.124.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.124.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.124.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.124.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.125.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.125.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.125.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.125.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.125.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.125.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.126.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.126.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.126.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.126.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.126.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.126.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.127.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.127.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.127.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.127.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.127.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.127.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.128.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.128.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.128.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.128.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.128.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.128.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.129.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.129.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.129.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.129.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.129.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.129.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.13.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.13.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.13.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.13.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.13.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.13.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.130.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.130.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.130.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.130.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.130.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.130.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.131.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.131.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.131.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.131.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.131.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.131.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.132.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.132.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.132.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.132.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.132.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.132.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.133.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.133.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.133.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.133.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.133.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.133.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.134.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.134.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.134.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.134.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.134.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.134.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.135.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.135.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.135.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.135.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.135.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.135.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.136.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.136.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.136.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.136.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.136.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.136.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.137.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.137.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.137.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.137.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.137.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.137.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.138.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.138.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.138.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.138.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.138.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.138.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.139.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.139.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.139.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.139.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.139.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.139.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.14.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.14.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.14.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.14.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.14.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.14.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.140.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.140.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.140.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.140.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.140.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.140.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.141.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.141.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.141.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.141.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.141.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.141.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.142.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.142.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.142.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.142.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.142.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.142.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.143.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.143.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.143.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.143.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.143.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.143.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.144.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.144.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.144.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.144.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.144.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.144.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.145.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.145.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.145.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.145.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.145.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.145.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.146.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.146.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.146.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.146.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.146.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.146.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.147.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.147.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.147.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.147.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.147.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.147.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.148.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.148.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.148.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.148.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.148.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.148.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.149.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.149.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.149.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.149.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.149.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.149.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.15.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.15.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.15.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.15.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.15.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.15.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.150.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.150.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.150.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.150.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.150.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.150.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.151.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.151.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.151.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.151.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.151.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.151.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.152.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.152.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.152.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.152.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.152.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.152.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.153.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.153.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.153.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.153.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.153.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.153.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.154.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.154.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.154.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.154.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.154.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.154.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.155.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.155.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.155.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.155.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.155.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.155.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.156.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.156.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.156.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.156.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.156.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.156.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.157.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.157.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.157.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.157.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.157.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.157.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.158.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.158.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.158.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.158.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.158.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.158.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.159.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.159.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.159.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.159.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.159.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.159.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.16.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.16.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.16.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.16.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.16.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.16.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.17.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.17.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.17.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.17.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.17.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.17.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.18.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.18.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.18.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.18.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.18.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.18.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.19.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.19.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.19.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.19.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.19.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.19.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.2.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.2.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.2.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.2.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.2.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.2.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.20.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.20.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.20.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.20.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.20.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.20.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.21.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.21.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.21.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.21.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.21.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.21.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.22.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.22.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.22.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.22.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.22.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.22.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.23.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.23.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.23.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.23.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.23.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.23.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.24.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.24.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.24.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.24.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.24.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.24.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.25.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.25.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.25.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.25.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.25.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.25.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.26.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.26.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.26.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.26.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.26.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.26.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.27.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.27.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.27.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.27.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.27.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.27.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.28.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.28.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.28.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.28.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.28.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.28.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.29.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.29.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.29.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.29.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.29.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.29.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.3.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.3.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.3.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.3.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.3.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.3.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.30.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.30.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.30.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.30.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.30.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.30.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.31.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.31.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.31.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.31.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.31.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.31.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.32.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.32.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.32.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.32.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.32.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.32.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.33.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.33.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.33.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.33.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.33.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.33.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.34.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.34.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.34.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.34.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.34.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.34.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.35.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.35.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.35.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.35.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.35.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.35.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.36.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.36.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.36.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.36.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.36.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.36.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.37.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.37.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.37.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.37.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.37.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.37.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.38.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.38.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.38.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.38.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.38.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.38.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.39.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.39.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.39.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.39.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.39.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.39.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.4.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.4.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.4.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.4.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.4.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.4.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.40.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.40.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.40.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.40.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.40.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.40.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.41.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.41.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.41.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.41.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.41.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.41.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.42.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.42.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.42.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.42.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.42.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.42.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.43.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.43.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.43.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.43.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.43.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.43.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.44.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.44.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.44.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.44.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.44.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.44.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.45.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.45.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.45.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.45.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.45.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.45.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.46.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.46.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.46.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.46.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.46.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.46.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.47.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.47.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.47.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.47.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.47.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.47.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.48.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.48.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.48.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.48.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.48.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.48.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.49.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.49.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.49.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.49.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.49.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.49.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.5.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.5.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.5.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.5.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.5.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.5.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.50.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.50.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.50.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.50.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.50.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.50.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.51.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.51.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.51.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.51.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.51.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.51.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.52.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.52.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.52.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.52.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.52.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.52.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.53.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.53.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.53.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.53.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.53.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.53.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.54.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.54.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.54.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.54.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.54.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.54.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.55.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.55.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.55.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.55.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.55.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.55.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.56.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.56.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.56.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.56.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.56.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.56.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.57.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.57.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.57.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.57.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.57.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.57.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.58.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.58.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.58.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.58.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.58.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.58.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.59.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.59.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.59.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.59.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.59.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.59.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.6.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.6.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.6.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.6.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.6.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.6.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.60.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.60.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.60.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.60.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.60.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.60.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.61.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.61.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.61.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.61.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.61.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.61.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.62.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.62.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.62.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.62.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.62.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.62.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.63.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.63.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.63.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.63.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.63.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.63.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.64.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.64.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.64.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.64.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.64.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.64.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.65.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.65.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.65.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.65.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.65.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.65.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.66.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.66.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.66.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.66.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.66.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.66.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.67.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.67.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.67.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.67.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.67.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.67.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.68.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.68.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.68.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.68.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.68.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.68.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.69.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.69.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.69.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.69.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.69.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.69.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.7.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.7.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.7.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.7.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.7.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.7.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.70.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.70.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.70.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.70.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.70.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.70.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.71.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.71.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.71.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.71.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.71.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.71.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.72.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.72.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.72.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.72.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.72.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.72.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.73.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.73.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.73.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.73.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.73.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.73.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.74.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.74.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.74.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.74.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.74.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.74.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.75.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.75.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.75.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.75.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.75.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.75.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.76.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.76.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.76.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.76.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.76.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.76.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.77.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.77.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.77.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.77.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.77.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.77.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.78.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.78.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.78.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.78.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.78.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.78.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.79.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.79.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.79.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.79.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.79.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.79.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.8.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.8.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.8.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.8.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.8.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.8.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.80.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.80.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.80.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.80.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.80.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.80.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.81.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.81.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.81.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.81.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.81.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.81.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.82.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.82.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.82.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.82.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.82.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.82.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.83.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.83.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.83.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.83.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.83.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.83.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.84.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.84.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.84.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.84.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.84.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.84.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.85.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.85.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.85.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.85.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.85.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.85.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.86.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.86.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.86.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.86.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.86.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.86.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.87.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.87.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.87.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.87.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.87.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.87.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.88.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.88.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.88.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.88.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.88.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.88.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.89.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.89.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.89.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.89.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.89.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.89.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.9.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.9.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.9.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.9.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.9.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.9.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.90.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.90.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.90.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.90.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.90.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.90.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.91.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.91.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.91.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.91.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.91.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.91.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.92.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.92.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.92.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.92.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.92.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.92.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.93.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.93.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.93.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.93.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.93.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.93.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.94.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.94.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.94.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.94.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.94.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.94.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.95.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.95.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.95.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.95.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.95.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.95.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.96.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.96.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.96.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.96.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.96.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.96.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.97.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.97.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.97.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.97.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.97.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.97.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.98.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.98.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.98.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.98.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.98.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.98.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.99.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.99.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.99.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.99.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.99.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.experts.99.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.gate.e_score_correction_bias": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.gate.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.shared_experts.down_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.shared_experts.down_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.shared_experts.gate_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.shared_experts.gate_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.shared_experts.up_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.mlp.shared_experts.up_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.post_attention_layernorm.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.self_attn.k_norm.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.self_attn.k_proj.bias": "model-00009-of-00092.safetensors",
+ "model.layers.8.self_attn.k_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.self_attn.k_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.self_attn.o_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.self_attn.o_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.self_attn.q_norm.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.self_attn.q_proj.bias": "model-00009-of-00092.safetensors",
+ "model.layers.8.self_attn.q_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.self_attn.q_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.8.self_attn.v_proj.bias": "model-00009-of-00092.safetensors",
+ "model.layers.8.self_attn.v_proj.weight": "model-00009-of-00092.safetensors",
+ "model.layers.8.self_attn.v_proj.weight_scale": "model-00009-of-00092.safetensors",
+ "model.layers.80.input_layernorm.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.0.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.0.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.0.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.0.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.0.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.0.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.1.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.1.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.1.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.1.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.1.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.1.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.10.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.10.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.10.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.10.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.10.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.10.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.100.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.100.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.100.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.100.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.100.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.100.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.101.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.101.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.101.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.101.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.101.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.101.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.102.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.102.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.102.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.102.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.102.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.102.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.103.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.103.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.103.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.103.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.103.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.103.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.104.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.104.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.104.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.104.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.104.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.104.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.105.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.105.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.105.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.105.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.105.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.105.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.106.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.106.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.106.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.106.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.106.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.106.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.107.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.107.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.107.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.107.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.107.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.107.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.108.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.108.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.108.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.108.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.108.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.108.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.109.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.109.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.109.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.109.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.109.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.109.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.11.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.11.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.11.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.11.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.11.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.11.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.110.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.110.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.110.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.110.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.110.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.110.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.111.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.111.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.111.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.111.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.111.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.111.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.112.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.112.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.112.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.112.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.112.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.112.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.113.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.113.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.113.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.113.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.113.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.113.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.114.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.114.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.114.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.114.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.114.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.114.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.115.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.115.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.115.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.115.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.115.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.115.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.116.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.116.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.116.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.116.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.116.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.116.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.117.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.117.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.117.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.117.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.117.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.117.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.118.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.118.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.118.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.118.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.118.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.118.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.119.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.119.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.119.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.119.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.119.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.119.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.12.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.12.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.12.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.12.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.12.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.12.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.120.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.120.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.120.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.120.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.120.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.120.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.121.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.121.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.121.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.121.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.121.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.121.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.122.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.122.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.122.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.122.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.122.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.122.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.123.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.123.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.123.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.123.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.123.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.123.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.124.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.124.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.124.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.124.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.124.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.124.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.125.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.125.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.125.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.125.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.125.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.125.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.126.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.126.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.126.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.126.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.126.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.126.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.127.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.127.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.127.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.127.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.127.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.127.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.128.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.128.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.128.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.128.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.128.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.128.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.129.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.129.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.129.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.129.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.129.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.129.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.13.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.13.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.13.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.13.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.13.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.13.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.130.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.130.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.130.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.130.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.130.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.130.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.131.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.131.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.131.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.131.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.131.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.131.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.132.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.132.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.132.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.132.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.132.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.132.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.133.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.133.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.133.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.133.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.133.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.133.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.134.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.134.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.134.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.134.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.134.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.134.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.135.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.135.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.135.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.135.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.135.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.135.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.136.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.136.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.136.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.136.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.136.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.136.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.137.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.137.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.137.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.137.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.137.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.137.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.138.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.138.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.138.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.138.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.138.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.138.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.139.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.139.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.139.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.139.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.139.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.139.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.14.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.14.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.14.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.14.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.14.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.14.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.140.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.140.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.140.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.140.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.140.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.140.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.141.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.141.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.141.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.141.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.141.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.141.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.142.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.142.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.142.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.142.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.142.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.142.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.143.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.143.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.143.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.143.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.143.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.143.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.144.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.144.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.144.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.144.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.144.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.144.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.145.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.145.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.145.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.145.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.145.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.145.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.146.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.146.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.146.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.146.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.146.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.146.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.147.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.147.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.147.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.147.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.147.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.147.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.148.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.148.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.148.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.148.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.148.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.148.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.149.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.149.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.149.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.149.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.149.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.149.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.15.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.15.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.15.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.15.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.15.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.15.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.150.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.150.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.150.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.150.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.150.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.150.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.151.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.151.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.151.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.151.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.151.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.151.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.152.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.152.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.152.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.152.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.152.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.152.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.153.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.153.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.153.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.153.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.153.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.153.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.154.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.154.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.154.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.154.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.154.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.154.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.155.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.155.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.155.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.155.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.155.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.155.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.156.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.156.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.156.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.156.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.156.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.156.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.157.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.157.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.157.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.157.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.157.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.157.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.158.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.158.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.158.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.158.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.158.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.158.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.159.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.159.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.159.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.159.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.159.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.159.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.16.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.16.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.16.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.16.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.16.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.16.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.17.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.17.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.17.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.17.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.17.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.17.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.18.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.18.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.18.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.18.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.18.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.18.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.19.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.19.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.19.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.19.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.19.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.19.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.2.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.2.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.2.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.2.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.2.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.2.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.20.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.20.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.20.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.20.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.20.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.20.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.21.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.21.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.21.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.21.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.21.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.21.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.22.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.22.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.22.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.22.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.22.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.22.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.23.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.23.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.23.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.23.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.23.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.23.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.24.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.24.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.24.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.24.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.24.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.24.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.25.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.25.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.25.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.25.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.25.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.25.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.26.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.26.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.26.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.26.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.26.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.26.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.27.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.27.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.27.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.27.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.27.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.27.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.28.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.28.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.28.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.28.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.28.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.28.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.29.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.29.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.29.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.29.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.29.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.29.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.3.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.3.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.3.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.3.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.3.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.3.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.30.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.30.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.30.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.30.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.30.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.30.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.31.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.31.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.31.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.31.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.31.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.31.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.32.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.32.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.32.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.32.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.32.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.32.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.33.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.33.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.33.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.33.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.33.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.33.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.34.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.34.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.34.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.34.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.34.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.34.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.35.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.35.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.35.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.35.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.35.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.35.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.36.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.36.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.36.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.36.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.36.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.36.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.37.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.37.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.37.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.37.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.37.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.37.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.38.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.38.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.38.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.38.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.38.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.38.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.39.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.39.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.39.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.39.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.39.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.39.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.4.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.4.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.4.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.4.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.4.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.4.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.40.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.40.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.40.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.40.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.40.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.40.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.41.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.41.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.41.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.41.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.41.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.41.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.42.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.42.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.42.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.42.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.42.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.42.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.43.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.43.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.43.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.43.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.43.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.43.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.44.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.44.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.44.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.44.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.44.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.44.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.45.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.45.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.45.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.45.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.45.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.45.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.46.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.46.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.46.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.46.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.46.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.46.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.47.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.47.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.47.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.47.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.47.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.47.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.48.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.48.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.48.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.48.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.48.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.48.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.49.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.49.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.49.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.49.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.49.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.49.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.5.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.5.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.5.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.5.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.5.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.5.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.50.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.50.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.50.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.50.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.50.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.50.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.51.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.51.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.51.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.51.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.51.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.51.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.52.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.52.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.52.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.52.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.52.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.52.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.53.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.53.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.53.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.53.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.53.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.53.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.54.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.54.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.54.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.54.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.54.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.54.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.55.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.55.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.55.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.55.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.55.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.55.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.56.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.56.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.56.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.56.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.56.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.56.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.57.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.57.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.57.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.57.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.57.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.57.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.58.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.58.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.58.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.58.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.58.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.58.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.59.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.59.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.59.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.59.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.59.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.59.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.6.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.6.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.6.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.6.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.6.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.6.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.60.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.60.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.60.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.60.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.60.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.60.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.61.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.61.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.61.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.61.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.61.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.61.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.62.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.62.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.62.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.62.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.62.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.62.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.63.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.63.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.63.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.63.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.63.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.63.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.64.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.64.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.64.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.64.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.64.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.64.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.65.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.65.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.65.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.65.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.65.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.65.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.66.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.66.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.66.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.66.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.66.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.66.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.67.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.67.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.67.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.67.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.67.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.67.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.68.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.68.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.68.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.68.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.68.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.68.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.69.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.69.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.69.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.69.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.69.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.69.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.7.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.7.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.7.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.7.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.7.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.7.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.70.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.70.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.70.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.70.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.70.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.70.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.71.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.71.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.71.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.71.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.71.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.71.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.72.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.72.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.72.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.72.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.72.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.72.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.73.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.73.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.73.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.73.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.73.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.73.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.74.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.74.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.74.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.74.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.74.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.74.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.75.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.75.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.75.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.75.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.75.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.75.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.76.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.76.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.76.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.76.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.76.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.76.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.77.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.77.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.77.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.77.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.77.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.77.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.78.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.78.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.78.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.78.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.78.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.78.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.79.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.79.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.79.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.79.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.79.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.79.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.8.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.8.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.8.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.8.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.8.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.8.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.80.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.80.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.80.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.80.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.80.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.80.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.81.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.81.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.81.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.81.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.81.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.81.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.82.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.82.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.82.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.82.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.82.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.82.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.83.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.83.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.83.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.83.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.83.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.83.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.84.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.84.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.84.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.84.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.84.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.84.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.85.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.85.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.85.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.85.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.85.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.85.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.86.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.86.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.86.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.86.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.86.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.86.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.87.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.87.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.87.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.87.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.87.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.87.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.88.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.88.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.88.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.88.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.88.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.88.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.89.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.89.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.89.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.89.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.89.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.89.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.9.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.9.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.9.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.9.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.9.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.9.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.90.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.90.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.90.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.90.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.90.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.90.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.91.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.91.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.91.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.91.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.91.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.91.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.92.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.92.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.92.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.92.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.92.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.92.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.93.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.93.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.93.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.93.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.93.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.93.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.94.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.94.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.94.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.94.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.94.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.94.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.95.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.95.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.95.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.95.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.95.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.95.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.96.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.96.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.96.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.96.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.96.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.96.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.97.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.97.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.97.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.97.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.97.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.97.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.98.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.98.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.98.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.98.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.98.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.98.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.99.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.99.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.99.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.99.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.99.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.experts.99.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.gate.e_score_correction_bias": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.gate.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.shared_experts.down_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.shared_experts.down_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.shared_experts.gate_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.shared_experts.gate_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.shared_experts.up_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.mlp.shared_experts.up_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.post_attention_layernorm.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.self_attn.k_norm.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.self_attn.k_proj.bias": "model-00081-of-00092.safetensors",
+ "model.layers.80.self_attn.k_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.self_attn.k_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.self_attn.o_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.self_attn.o_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.self_attn.q_norm.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.self_attn.q_proj.bias": "model-00081-of-00092.safetensors",
+ "model.layers.80.self_attn.q_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.self_attn.q_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.80.self_attn.v_proj.bias": "model-00081-of-00092.safetensors",
+ "model.layers.80.self_attn.v_proj.weight": "model-00081-of-00092.safetensors",
+ "model.layers.80.self_attn.v_proj.weight_scale": "model-00081-of-00092.safetensors",
+ "model.layers.81.input_layernorm.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.0.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.0.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.0.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.0.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.0.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.0.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.1.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.1.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.1.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.1.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.1.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.1.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.10.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.10.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.10.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.10.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.10.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.10.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.100.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.100.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.100.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.100.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.100.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.100.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.101.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.101.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.101.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.101.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.101.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.101.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.102.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.102.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.102.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.102.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.102.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.102.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.103.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.103.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.103.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.103.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.103.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.103.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.104.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.104.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.104.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.104.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.104.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.104.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.105.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.105.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.105.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.105.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.105.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.105.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.106.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.106.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.106.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.106.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.106.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.106.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.107.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.107.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.107.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.107.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.107.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.107.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.108.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.108.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.108.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.108.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.108.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.108.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.109.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.109.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.109.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.109.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.109.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.109.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.11.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.11.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.11.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.11.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.11.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.11.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.110.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.110.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.110.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.110.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.110.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.110.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.111.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.111.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.111.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.111.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.111.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.111.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.112.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.112.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.112.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.112.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.112.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.112.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.113.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.113.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.113.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.113.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.113.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.113.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.114.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.114.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.114.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.114.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.114.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.114.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.115.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.115.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.115.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.115.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.115.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.115.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.116.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.116.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.116.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.116.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.116.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.116.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.117.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.117.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.117.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.117.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.117.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.117.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.118.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.118.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.118.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.118.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.118.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.118.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.119.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.119.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.119.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.119.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.119.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.119.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.12.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.12.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.12.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.12.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.12.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.12.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.120.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.120.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.120.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.120.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.120.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.120.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.121.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.121.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.121.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.121.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.121.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.121.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.122.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.122.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.122.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.122.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.122.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.122.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.123.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.123.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.123.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.123.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.123.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.123.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.124.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.124.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.124.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.124.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.124.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.124.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.125.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.125.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.125.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.125.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.125.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.125.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.126.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.126.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.126.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.126.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.126.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.126.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.127.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.127.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.127.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.127.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.127.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.127.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.128.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.128.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.128.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.128.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.128.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.128.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.129.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.129.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.129.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.129.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.129.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.129.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.13.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.13.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.13.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.13.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.13.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.13.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.130.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.130.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.130.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.130.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.130.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.130.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.131.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.131.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.131.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.131.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.131.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.131.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.132.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.132.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.132.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.132.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.132.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.132.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.133.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.133.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.133.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.133.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.133.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.133.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.134.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.134.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.134.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.134.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.134.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.134.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.135.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.135.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.135.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.135.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.135.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.135.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.136.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.136.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.136.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.136.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.136.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.136.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.137.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.137.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.137.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.137.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.137.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.137.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.138.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.138.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.138.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.138.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.138.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.138.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.139.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.139.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.139.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.139.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.139.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.139.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.14.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.14.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.14.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.14.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.14.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.14.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.140.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.140.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.140.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.140.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.140.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.140.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.141.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.141.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.141.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.141.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.141.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.141.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.142.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.142.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.142.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.142.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.142.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.142.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.143.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.143.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.143.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.143.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.143.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.143.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.144.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.144.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.144.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.144.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.144.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.144.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.145.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.145.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.145.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.145.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.145.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.145.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.146.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.146.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.146.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.146.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.146.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.146.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.147.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.147.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.147.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.147.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.147.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.147.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.148.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.148.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.148.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.148.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.148.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.148.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.149.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.149.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.149.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.149.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.149.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.149.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.15.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.15.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.15.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.15.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.15.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.15.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.150.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.150.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.150.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.150.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.150.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.150.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.151.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.151.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.151.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.151.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.151.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.151.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.152.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.152.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.152.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.152.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.152.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.152.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.153.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.153.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.153.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.153.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.153.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.153.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.154.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.154.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.154.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.154.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.154.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.154.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.155.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.155.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.155.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.155.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.155.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.155.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.156.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.156.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.156.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.156.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.156.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.156.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.157.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.157.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.157.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.157.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.157.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.157.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.158.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.158.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.158.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.158.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.158.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.158.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.159.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.159.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.159.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.159.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.159.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.159.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.16.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.16.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.16.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.16.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.16.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.16.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.17.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.17.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.17.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.17.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.17.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.17.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.18.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.18.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.18.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.18.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.18.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.18.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.19.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.19.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.19.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.19.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.19.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.19.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.2.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.2.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.2.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.2.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.2.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.2.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.20.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.20.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.20.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.20.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.20.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.20.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.21.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.21.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.21.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.21.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.21.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.21.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.22.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.22.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.22.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.22.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.22.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.22.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.23.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.23.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.23.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.23.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.23.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.23.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.24.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.24.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.24.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.24.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.24.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.24.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.25.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.25.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.25.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.25.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.25.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.25.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.26.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.26.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.26.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.26.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.26.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.26.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.27.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.27.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.27.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.27.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.27.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.27.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.28.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.28.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.28.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.28.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.28.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.28.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.29.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.29.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.29.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.29.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.29.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.29.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.3.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.3.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.3.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.3.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.3.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.3.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.30.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.30.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.30.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.30.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.30.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.30.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.31.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.31.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.31.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.31.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.31.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.31.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.32.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.32.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.32.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.32.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.32.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.32.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.33.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.33.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.33.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.33.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.33.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.33.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.34.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.34.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.34.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.34.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.34.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.34.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.35.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.35.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.35.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.35.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.35.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.35.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.36.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.36.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.36.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.36.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.36.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.36.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.37.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.37.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.37.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.37.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.37.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.37.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.38.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.38.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.38.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.38.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.38.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.38.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.39.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.39.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.39.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.39.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.39.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.39.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.4.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.4.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.4.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.4.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.4.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.4.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.40.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.40.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.40.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.40.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.40.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.40.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.41.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.41.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.41.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.41.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.41.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.41.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.42.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.42.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.42.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.42.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.42.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.42.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.43.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.43.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.43.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.43.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.43.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.43.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.44.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.44.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.44.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.44.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.44.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.44.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.45.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.45.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.45.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.45.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.45.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.45.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.46.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.46.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.46.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.46.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.46.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.46.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.47.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.47.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.47.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.47.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.47.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.47.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.48.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.48.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.48.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.48.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.48.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.48.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.49.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.49.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.49.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.49.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.49.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.49.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.5.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.5.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.5.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.5.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.5.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.5.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.50.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.50.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.50.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.50.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.50.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.50.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.51.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.51.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.51.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.51.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.51.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.51.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.52.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.52.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.52.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.52.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.52.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.52.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.53.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.53.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.53.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.53.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.53.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.53.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.54.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.54.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.54.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.54.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.54.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.54.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.55.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.55.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.55.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.55.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.55.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.55.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.56.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.56.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.56.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.56.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.56.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.56.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.57.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.57.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.57.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.57.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.57.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.57.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.58.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.58.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.58.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.58.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.58.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.58.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.59.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.59.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.59.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.59.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.59.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.59.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.6.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.6.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.6.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.6.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.6.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.6.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.60.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.60.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.60.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.60.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.60.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.60.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.61.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.61.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.61.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.61.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.61.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.61.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.62.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.62.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.62.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.62.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.62.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.62.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.63.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.63.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.63.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.63.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.63.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.63.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.64.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.64.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.64.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.64.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.64.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.64.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.65.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.65.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.65.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.65.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.65.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.65.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.66.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.66.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.66.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.66.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.66.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.66.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.67.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.67.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.67.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.67.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.67.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.67.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.68.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.68.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.68.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.68.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.68.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.68.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.69.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.69.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.69.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.69.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.69.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.69.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.7.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.7.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.7.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.7.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.7.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.7.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.70.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.70.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.70.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.70.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.70.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.70.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.71.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.71.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.71.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.71.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.71.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.71.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.72.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.72.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.72.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.72.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.72.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.72.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.73.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.73.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.73.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.73.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.73.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.73.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.74.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.74.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.74.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.74.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.74.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.74.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.75.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.75.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.75.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.75.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.75.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.75.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.76.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.76.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.76.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.76.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.76.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.76.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.77.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.77.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.77.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.77.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.77.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.77.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.78.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.78.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.78.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.78.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.78.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.78.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.79.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.79.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.79.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.79.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.79.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.79.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.8.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.8.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.8.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.8.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.8.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.8.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.80.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.80.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.80.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.80.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.80.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.80.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.81.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.81.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.81.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.81.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.81.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.81.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.82.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.82.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.82.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.82.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.82.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.82.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.83.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.83.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.83.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.83.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.83.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.83.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.84.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.84.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.84.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.84.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.84.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.84.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.85.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.85.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.85.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.85.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.85.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.85.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.86.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.86.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.86.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.86.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.86.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.86.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.87.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.87.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.87.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.87.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.87.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.87.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.88.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.88.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.88.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.88.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.88.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.88.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.89.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.89.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.89.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.89.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.89.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.89.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.9.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.9.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.9.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.9.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.9.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.9.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.90.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.90.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.90.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.90.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.90.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.90.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.91.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.91.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.91.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.91.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.91.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.91.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.92.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.92.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.92.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.92.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.92.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.92.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.93.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.93.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.93.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.93.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.93.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.93.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.94.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.94.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.94.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.94.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.94.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.94.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.95.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.95.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.95.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.95.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.95.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.95.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.96.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.96.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.96.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.96.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.96.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.96.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.97.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.97.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.97.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.97.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.97.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.97.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.98.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.98.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.98.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.98.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.98.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.98.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.99.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.99.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.99.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.99.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.99.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.experts.99.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.gate.e_score_correction_bias": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.gate.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.shared_experts.down_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.shared_experts.down_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.shared_experts.gate_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.shared_experts.gate_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.shared_experts.up_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.mlp.shared_experts.up_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.post_attention_layernorm.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.self_attn.k_norm.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.self_attn.k_proj.bias": "model-00082-of-00092.safetensors",
+ "model.layers.81.self_attn.k_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.self_attn.k_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.self_attn.o_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.self_attn.o_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.self_attn.q_norm.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.self_attn.q_proj.bias": "model-00082-of-00092.safetensors",
+ "model.layers.81.self_attn.q_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.self_attn.q_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.81.self_attn.v_proj.bias": "model-00082-of-00092.safetensors",
+ "model.layers.81.self_attn.v_proj.weight": "model-00082-of-00092.safetensors",
+ "model.layers.81.self_attn.v_proj.weight_scale": "model-00082-of-00092.safetensors",
+ "model.layers.82.input_layernorm.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.0.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.0.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.0.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.0.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.0.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.0.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.1.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.1.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.1.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.1.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.1.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.1.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.10.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.10.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.10.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.10.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.10.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.10.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.100.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.100.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.100.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.100.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.100.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.100.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.101.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.101.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.101.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.101.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.101.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.101.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.102.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.102.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.102.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.102.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.102.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.102.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.103.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.103.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.103.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.103.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.103.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.103.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.104.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.104.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.104.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.104.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.104.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.104.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.105.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.105.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.105.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.105.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.105.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.105.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.106.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.106.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.106.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.106.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.106.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.106.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.107.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.107.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.107.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.107.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.107.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.107.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.108.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.108.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.108.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.108.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.108.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.108.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.109.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.109.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.109.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.109.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.109.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.109.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.11.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.11.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.11.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.11.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.11.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.11.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.110.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.110.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.110.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.110.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.110.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.110.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.111.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.111.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.111.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.111.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.111.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.111.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.112.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.112.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.112.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.112.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.112.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.112.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.113.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.113.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.113.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.113.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.113.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.113.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.114.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.114.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.114.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.114.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.114.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.114.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.115.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.115.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.115.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.115.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.115.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.115.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.116.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.116.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.116.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.116.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.116.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.116.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.117.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.117.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.117.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.117.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.117.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.117.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.118.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.118.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.118.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.118.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.118.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.118.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.119.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.119.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.119.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.119.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.119.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.119.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.12.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.12.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.12.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.12.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.12.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.12.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.120.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.120.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.120.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.120.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.120.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.120.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.121.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.121.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.121.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.121.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.121.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.121.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.122.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.122.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.122.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.122.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.122.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.122.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.123.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.123.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.123.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.123.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.123.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.123.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.124.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.124.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.124.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.124.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.124.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.124.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.125.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.125.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.125.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.125.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.125.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.125.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.126.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.126.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.126.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.126.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.126.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.126.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.127.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.127.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.127.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.127.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.127.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.127.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.128.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.128.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.128.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.128.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.128.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.128.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.129.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.129.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.129.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.129.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.129.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.129.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.13.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.13.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.13.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.13.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.13.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.13.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.130.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.130.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.130.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.130.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.130.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.130.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.131.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.131.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.131.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.131.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.131.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.131.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.132.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.132.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.132.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.132.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.132.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.132.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.133.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.133.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.133.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.133.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.133.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.133.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.134.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.134.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.134.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.134.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.134.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.134.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.135.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.135.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.135.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.135.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.135.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.135.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.136.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.136.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.136.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.136.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.136.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.136.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.137.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.137.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.137.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.137.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.137.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.137.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.138.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.138.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.138.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.138.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.138.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.138.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.139.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.139.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.139.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.139.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.139.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.139.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.14.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.14.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.14.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.14.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.14.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.14.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.140.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.140.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.140.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.140.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.140.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.140.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.141.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.141.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.141.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.141.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.141.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.141.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.142.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.142.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.142.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.142.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.142.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.142.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.143.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.143.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.143.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.143.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.143.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.143.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.144.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.144.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.144.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.144.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.144.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.144.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.145.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.145.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.145.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.145.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.145.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.145.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.146.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.146.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.146.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.146.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.146.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.146.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.147.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.147.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.147.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.147.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.147.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.147.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.148.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.148.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.148.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.148.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.148.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.148.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.149.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.149.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.149.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.149.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.149.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.149.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.15.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.15.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.15.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.15.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.15.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.15.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.150.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.150.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.150.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.150.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.150.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.150.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.151.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.151.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.151.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.151.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.151.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.151.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.152.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.152.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.152.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.152.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.152.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.152.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.153.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.153.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.153.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.153.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.153.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.153.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.154.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.154.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.154.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.154.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.154.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.154.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.155.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.155.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.155.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.155.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.155.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.155.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.156.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.156.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.156.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.156.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.156.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.156.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.157.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.157.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.157.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.157.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.157.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.157.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.158.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.158.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.158.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.158.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.158.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.158.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.159.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.159.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.159.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.159.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.159.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.159.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.16.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.16.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.16.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.16.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.16.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.16.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.17.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.17.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.17.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.17.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.17.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.17.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.18.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.18.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.18.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.18.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.18.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.18.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.19.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.19.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.19.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.19.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.19.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.19.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.2.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.2.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.2.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.2.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.2.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.2.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.20.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.20.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.20.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.20.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.20.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.20.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.21.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.21.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.21.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.21.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.21.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.21.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.22.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.22.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.22.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.22.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.22.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.22.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.23.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.23.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.23.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.23.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.23.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.23.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.24.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.24.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.24.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.24.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.24.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.24.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.25.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.25.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.25.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.25.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.25.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.25.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.26.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.26.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.26.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.26.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.26.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.26.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.27.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.27.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.27.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.27.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.27.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.27.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.28.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.28.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.28.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.28.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.28.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.28.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.29.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.29.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.29.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.29.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.29.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.29.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.3.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.3.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.3.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.3.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.3.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.3.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.30.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.30.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.30.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.30.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.30.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.30.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.31.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.31.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.31.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.31.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.31.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.31.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.32.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.32.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.32.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.32.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.32.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.32.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.33.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.33.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.33.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.33.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.33.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.33.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.34.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.34.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.34.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.34.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.34.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.34.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.35.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.35.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.35.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.35.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.35.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.35.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.36.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.36.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.36.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.36.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.36.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.36.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.37.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.37.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.37.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.37.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.37.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.37.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.38.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.38.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.38.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.38.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.38.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.38.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.39.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.39.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.39.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.39.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.39.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.39.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.4.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.4.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.4.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.4.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.4.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.4.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.40.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.40.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.40.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.40.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.40.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.40.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.41.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.41.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.41.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.41.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.41.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.41.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.42.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.42.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.42.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.42.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.42.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.42.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.43.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.43.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.43.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.43.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.43.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.43.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.44.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.44.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.44.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.44.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.44.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.44.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.45.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.45.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.45.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.45.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.45.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.45.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.46.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.46.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.46.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.46.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.46.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.46.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.47.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.47.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.47.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.47.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.47.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.47.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.48.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.48.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.48.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.48.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.48.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.48.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.49.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.49.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.49.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.49.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.49.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.49.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.5.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.5.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.5.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.5.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.5.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.5.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.50.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.50.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.50.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.50.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.50.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.50.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.51.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.51.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.51.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.51.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.51.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.51.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.52.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.52.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.52.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.52.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.52.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.52.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.53.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.53.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.53.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.53.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.53.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.53.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.54.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.54.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.54.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.54.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.54.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.54.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.55.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.55.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.55.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.55.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.55.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.55.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.56.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.56.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.56.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.56.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.56.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.56.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.57.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.57.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.57.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.57.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.57.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.57.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.58.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.58.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.58.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.58.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.58.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.58.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.59.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.59.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.59.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.59.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.59.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.59.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.6.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.6.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.6.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.6.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.6.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.6.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.60.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.60.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.60.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.60.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.60.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.60.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.61.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.61.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.61.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.61.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.61.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.61.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.62.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.62.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.62.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.62.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.62.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.62.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.63.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.63.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.63.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.63.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.63.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.63.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.64.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.64.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.64.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.64.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.64.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.64.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.65.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.65.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.65.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.65.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.65.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.65.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.66.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.66.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.66.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.66.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.66.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.66.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.67.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.67.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.67.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.67.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.67.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.67.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.68.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.68.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.68.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.68.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.68.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.68.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.69.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.69.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.69.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.69.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.69.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.69.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.7.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.7.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.7.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.7.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.7.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.7.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.70.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.70.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.70.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.70.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.70.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.70.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.71.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.71.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.71.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.71.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.71.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.71.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.72.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.72.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.72.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.72.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.72.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.72.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.73.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.73.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.73.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.73.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.73.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.73.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.74.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.74.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.74.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.74.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.74.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.74.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.75.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.75.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.75.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.75.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.75.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.75.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.76.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.76.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.76.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.76.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.76.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.76.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.77.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.77.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.77.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.77.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.77.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.77.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.78.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.78.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.78.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.78.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.78.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.78.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.79.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.79.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.79.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.79.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.79.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.79.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.8.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.8.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.8.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.8.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.8.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.8.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.80.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.80.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.80.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.80.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.80.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.80.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.81.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.81.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.81.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.81.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.81.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.81.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.82.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.82.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.82.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.82.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.82.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.82.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.83.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.83.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.83.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.83.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.83.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.83.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.84.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.84.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.84.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.84.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.84.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.84.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.85.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.85.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.85.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.85.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.85.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.85.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.86.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.86.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.86.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.86.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.86.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.86.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.87.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.87.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.87.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.87.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.87.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.87.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.88.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.88.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.88.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.88.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.88.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.88.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.89.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.89.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.89.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.89.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.89.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.89.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.9.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.9.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.9.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.9.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.9.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.9.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.90.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.90.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.90.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.90.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.90.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.90.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.91.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.91.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.91.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.91.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.91.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.91.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.92.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.92.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.92.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.92.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.92.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.92.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.93.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.93.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.93.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.93.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.93.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.93.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.94.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.94.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.94.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.94.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.94.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.94.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.95.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.95.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.95.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.95.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.95.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.95.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.96.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.96.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.96.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.96.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.96.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.96.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.97.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.97.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.97.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.97.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.97.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.97.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.98.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.98.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.98.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.98.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.98.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.98.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.99.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.99.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.99.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.99.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.99.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.experts.99.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.gate.e_score_correction_bias": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.gate.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.shared_experts.down_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.shared_experts.down_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.shared_experts.gate_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.shared_experts.gate_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.shared_experts.up_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.mlp.shared_experts.up_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.post_attention_layernorm.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.self_attn.k_norm.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.self_attn.k_proj.bias": "model-00083-of-00092.safetensors",
+ "model.layers.82.self_attn.k_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.self_attn.k_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.self_attn.o_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.self_attn.o_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.self_attn.q_norm.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.self_attn.q_proj.bias": "model-00083-of-00092.safetensors",
+ "model.layers.82.self_attn.q_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.self_attn.q_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.82.self_attn.v_proj.bias": "model-00083-of-00092.safetensors",
+ "model.layers.82.self_attn.v_proj.weight": "model-00083-of-00092.safetensors",
+ "model.layers.82.self_attn.v_proj.weight_scale": "model-00083-of-00092.safetensors",
+ "model.layers.83.input_layernorm.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.0.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.0.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.0.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.0.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.0.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.0.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.1.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.1.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.1.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.1.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.1.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.1.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.10.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.10.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.10.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.10.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.10.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.10.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.100.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.100.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.100.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.100.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.100.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.100.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.101.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.101.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.101.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.101.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.101.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.101.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.102.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.102.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.102.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.102.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.102.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.102.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.103.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.103.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.103.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.103.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.103.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.103.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.104.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.104.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.104.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.104.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.104.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.104.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.105.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.105.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.105.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.105.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.105.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.105.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.106.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.106.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.106.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.106.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.106.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.106.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.107.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.107.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.107.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.107.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.107.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.107.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.108.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.108.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.108.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.108.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.108.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.108.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.109.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.109.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.109.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.109.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.109.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.109.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.11.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.11.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.11.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.11.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.11.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.11.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.110.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.110.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.110.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.110.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.110.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.110.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.111.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.111.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.111.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.111.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.111.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.111.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.112.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.112.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.112.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.112.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.112.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.112.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.113.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.113.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.113.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.113.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.113.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.113.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.114.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.114.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.114.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.114.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.114.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.114.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.115.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.115.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.115.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.115.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.115.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.115.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.116.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.116.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.116.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.116.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.116.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.116.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.117.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.117.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.117.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.117.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.117.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.117.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.118.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.118.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.118.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.118.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.118.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.118.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.119.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.119.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.119.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.119.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.119.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.119.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.12.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.12.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.12.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.12.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.12.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.12.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.120.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.120.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.120.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.120.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.120.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.120.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.121.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.121.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.121.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.121.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.121.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.121.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.122.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.122.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.122.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.122.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.122.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.122.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.123.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.123.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.123.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.123.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.123.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.123.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.124.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.124.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.124.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.124.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.124.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.124.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.125.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.125.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.125.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.125.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.125.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.125.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.126.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.126.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.126.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.126.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.126.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.126.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.127.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.127.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.127.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.127.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.127.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.127.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.128.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.128.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.128.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.128.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.128.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.128.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.129.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.129.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.129.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.129.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.129.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.129.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.13.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.13.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.13.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.13.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.13.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.13.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.130.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.130.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.130.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.130.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.130.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.130.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.131.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.131.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.131.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.131.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.131.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.131.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.132.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.132.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.132.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.132.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.132.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.132.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.133.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.133.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.133.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.133.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.133.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.133.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.134.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.134.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.134.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.134.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.134.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.134.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.135.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.135.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.135.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.135.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.135.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.135.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.136.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.136.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.136.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.136.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.136.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.136.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.137.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.137.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.137.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.137.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.137.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.137.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.138.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.138.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.138.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.138.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.138.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.138.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.139.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.139.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.139.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.139.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.139.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.139.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.14.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.14.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.14.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.14.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.14.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.14.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.140.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.140.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.140.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.140.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.140.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.140.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.141.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.141.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.141.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.141.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.141.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.141.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.142.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.142.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.142.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.142.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.142.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.142.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.143.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.143.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.143.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.143.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.143.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.143.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.144.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.144.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.144.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.144.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.144.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.144.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.145.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.145.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.145.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.145.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.145.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.145.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.146.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.146.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.146.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.146.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.146.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.146.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.147.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.147.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.147.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.147.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.147.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.147.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.148.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.148.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.148.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.148.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.148.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.148.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.149.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.149.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.149.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.149.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.149.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.149.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.15.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.15.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.15.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.15.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.15.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.15.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.150.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.150.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.150.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.150.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.150.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.150.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.151.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.151.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.151.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.151.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.151.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.151.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.152.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.152.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.152.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.152.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.152.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.152.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.153.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.153.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.153.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.153.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.153.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.153.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.154.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.154.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.154.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.154.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.154.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.154.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.155.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.155.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.155.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.155.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.155.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.155.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.156.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.156.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.156.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.156.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.156.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.156.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.157.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.157.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.157.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.157.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.157.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.157.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.158.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.158.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.158.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.158.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.158.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.158.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.159.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.159.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.159.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.159.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.159.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.159.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.16.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.16.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.16.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.16.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.16.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.16.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.17.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.17.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.17.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.17.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.17.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.17.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.18.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.18.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.18.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.18.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.18.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.18.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.19.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.19.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.19.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.19.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.19.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.19.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.2.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.2.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.2.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.2.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.2.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.2.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.20.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.20.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.20.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.20.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.20.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.20.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.21.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.21.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.21.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.21.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.21.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.21.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.22.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.22.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.22.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.22.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.22.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.22.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.23.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.23.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.23.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.23.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.23.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.23.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.24.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.24.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.24.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.24.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.24.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.24.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.25.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.25.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.25.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.25.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.25.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.25.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.26.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.26.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.26.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.26.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.26.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.26.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.27.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.27.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.27.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.27.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.27.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.27.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.28.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.28.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.28.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.28.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.28.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.28.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.29.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.29.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.29.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.29.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.29.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.29.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.3.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.3.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.3.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.3.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.3.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.3.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.30.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.30.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.30.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.30.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.30.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.30.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.31.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.31.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.31.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.31.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.31.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.31.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.32.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.32.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.32.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.32.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.32.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.32.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.33.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.33.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.33.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.33.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.33.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.33.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.34.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.34.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.34.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.34.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.34.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.34.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.35.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.35.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.35.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.35.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.35.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.35.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.36.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.36.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.36.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.36.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.36.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.36.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.37.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.37.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.37.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.37.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.37.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.37.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.38.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.38.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.38.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.38.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.38.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.38.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.39.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.39.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.39.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.39.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.39.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.39.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.4.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.4.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.4.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.4.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.4.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.4.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.40.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.40.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.40.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.40.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.40.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.40.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.41.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.41.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.41.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.41.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.41.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.41.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.42.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.42.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.42.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.42.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.42.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.42.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.43.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.43.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.43.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.43.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.43.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.43.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.44.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.44.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.44.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.44.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.44.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.44.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.45.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.45.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.45.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.45.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.45.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.45.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.46.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.46.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.46.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.46.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.46.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.46.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.47.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.47.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.47.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.47.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.47.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.47.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.48.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.48.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.48.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.48.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.48.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.48.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.49.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.49.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.49.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.49.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.49.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.49.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.5.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.5.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.5.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.5.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.5.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.5.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.50.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.50.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.50.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.50.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.50.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.50.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.51.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.51.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.51.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.51.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.51.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.51.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.52.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.52.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.52.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.52.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.52.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.52.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.53.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.53.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.53.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.53.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.53.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.53.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.54.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.54.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.54.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.54.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.54.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.54.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.55.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.55.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.55.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.55.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.55.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.55.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.56.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.56.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.56.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.56.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.56.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.56.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.57.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.57.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.57.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.57.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.57.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.57.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.58.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.58.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.58.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.58.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.58.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.58.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.59.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.59.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.59.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.59.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.59.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.59.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.6.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.6.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.6.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.6.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.6.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.6.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.60.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.60.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.60.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.60.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.60.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.60.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.61.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.61.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.61.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.61.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.61.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.61.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.62.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.62.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.62.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.62.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.62.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.62.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.63.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.63.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.63.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.63.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.63.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.63.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.64.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.64.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.64.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.64.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.64.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.64.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.65.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.65.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.65.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.65.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.65.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.65.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.66.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.66.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.66.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.66.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.66.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.66.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.67.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.67.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.67.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.67.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.67.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.67.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.68.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.68.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.68.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.68.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.68.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.68.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.69.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.69.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.69.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.69.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.69.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.69.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.7.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.7.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.7.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.7.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.7.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.7.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.70.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.70.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.70.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.70.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.70.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.70.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.71.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.71.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.71.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.71.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.71.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.71.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.72.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.72.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.72.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.72.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.72.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.72.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.73.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.73.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.73.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.73.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.73.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.73.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.74.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.74.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.74.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.74.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.74.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.74.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.75.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.75.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.75.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.75.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.75.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.75.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.76.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.76.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.76.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.76.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.76.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.76.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.77.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.77.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.77.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.77.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.77.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.77.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.78.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.78.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.78.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.78.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.78.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.78.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.79.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.79.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.79.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.79.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.79.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.79.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.8.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.8.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.8.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.8.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.8.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.8.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.80.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.80.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.80.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.80.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.80.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.80.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.81.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.81.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.81.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.81.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.81.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.81.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.82.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.82.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.82.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.82.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.82.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.82.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.83.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.83.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.83.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.83.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.83.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.83.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.84.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.84.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.84.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.84.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.84.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.84.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.85.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.85.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.85.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.85.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.85.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.85.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.86.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.86.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.86.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.86.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.86.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.86.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.87.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.87.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.87.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.87.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.87.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.87.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.88.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.88.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.88.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.88.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.88.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.88.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.89.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.89.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.89.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.89.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.89.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.89.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.9.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.9.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.9.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.9.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.9.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.9.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.90.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.90.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.90.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.90.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.90.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.90.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.91.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.91.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.91.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.91.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.91.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.91.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.92.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.92.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.92.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.92.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.92.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.92.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.93.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.93.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.93.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.93.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.93.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.93.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.94.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.94.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.94.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.94.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.94.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.94.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.95.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.95.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.95.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.95.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.95.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.95.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.96.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.96.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.96.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.96.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.96.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.96.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.97.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.97.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.97.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.97.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.97.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.97.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.98.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.98.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.98.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.98.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.98.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.98.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.99.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.99.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.99.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.99.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.99.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.experts.99.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.gate.e_score_correction_bias": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.gate.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.shared_experts.down_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.shared_experts.down_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.shared_experts.gate_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.shared_experts.gate_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.shared_experts.up_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.mlp.shared_experts.up_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.post_attention_layernorm.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.self_attn.k_norm.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.self_attn.k_proj.bias": "model-00084-of-00092.safetensors",
+ "model.layers.83.self_attn.k_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.self_attn.k_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.self_attn.o_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.self_attn.o_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.self_attn.q_norm.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.self_attn.q_proj.bias": "model-00084-of-00092.safetensors",
+ "model.layers.83.self_attn.q_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.self_attn.q_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.83.self_attn.v_proj.bias": "model-00084-of-00092.safetensors",
+ "model.layers.83.self_attn.v_proj.weight": "model-00084-of-00092.safetensors",
+ "model.layers.83.self_attn.v_proj.weight_scale": "model-00084-of-00092.safetensors",
+ "model.layers.84.input_layernorm.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.0.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.0.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.0.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.0.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.0.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.0.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.1.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.1.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.1.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.1.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.1.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.1.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.10.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.10.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.10.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.10.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.10.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.10.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.100.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.100.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.100.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.100.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.100.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.100.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.101.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.101.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.101.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.101.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.101.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.101.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.102.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.102.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.102.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.102.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.102.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.102.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.103.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.103.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.103.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.103.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.103.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.103.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.104.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.104.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.104.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.104.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.104.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.104.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.105.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.105.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.105.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.105.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.105.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.105.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.106.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.106.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.106.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.106.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.106.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.106.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.107.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.107.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.107.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.107.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.107.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.107.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.108.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.108.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.108.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.108.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.108.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.108.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.109.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.109.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.109.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.109.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.109.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.109.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.11.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.11.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.11.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.11.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.11.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.11.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.110.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.110.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.110.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.110.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.110.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.110.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.111.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.111.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.111.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.111.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.111.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.111.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.112.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.112.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.112.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.112.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.112.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.112.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.113.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.113.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.113.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.113.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.113.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.113.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.114.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.114.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.114.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.114.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.114.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.114.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.115.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.115.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.115.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.115.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.115.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.115.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.116.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.116.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.116.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.116.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.116.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.116.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.117.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.117.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.117.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.117.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.117.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.117.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.118.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.118.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.118.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.118.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.118.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.118.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.119.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.119.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.119.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.119.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.119.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.119.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.12.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.12.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.12.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.12.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.12.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.12.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.120.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.120.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.120.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.120.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.120.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.120.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.121.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.121.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.121.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.121.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.121.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.121.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.122.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.122.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.122.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.122.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.122.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.122.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.123.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.123.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.123.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.123.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.123.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.123.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.124.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.124.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.124.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.124.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.124.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.124.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.125.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.125.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.125.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.125.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.125.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.125.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.126.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.126.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.126.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.126.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.126.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.126.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.127.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.127.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.127.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.127.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.127.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.127.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.128.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.128.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.128.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.128.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.128.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.128.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.129.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.129.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.129.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.129.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.129.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.129.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.13.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.13.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.13.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.13.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.13.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.13.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.130.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.130.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.130.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.130.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.130.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.130.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.131.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.131.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.131.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.131.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.131.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.131.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.132.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.132.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.132.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.132.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.132.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.132.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.133.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.133.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.133.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.133.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.133.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.133.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.134.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.134.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.134.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.134.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.134.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.134.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.135.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.135.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.135.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.135.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.135.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.135.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.136.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.136.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.136.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.136.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.136.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.136.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.137.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.137.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.137.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.137.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.137.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.137.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.138.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.138.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.138.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.138.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.138.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.138.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.139.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.139.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.139.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.139.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.139.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.139.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.14.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.14.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.14.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.14.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.14.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.14.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.140.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.140.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.140.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.140.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.140.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.140.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.141.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.141.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.141.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.141.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.141.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.141.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.142.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.142.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.142.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.142.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.142.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.142.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.143.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.143.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.143.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.143.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.143.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.143.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.144.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.144.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.144.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.144.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.144.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.144.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.145.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.145.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.145.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.145.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.145.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.145.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.146.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.146.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.146.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.146.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.146.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.146.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.147.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.147.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.147.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.147.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.147.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.147.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.148.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.148.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.148.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.148.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.148.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.148.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.149.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.149.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.149.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.149.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.149.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.149.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.15.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.15.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.15.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.15.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.15.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.15.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.150.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.150.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.150.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.150.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.150.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.150.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.151.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.151.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.151.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.151.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.151.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.151.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.152.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.152.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.152.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.152.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.152.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.152.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.153.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.153.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.153.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.153.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.153.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.153.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.154.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.154.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.154.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.154.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.154.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.154.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.155.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.155.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.155.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.155.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.155.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.155.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.156.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.156.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.156.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.156.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.156.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.156.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.157.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.157.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.157.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.157.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.157.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.157.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.158.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.158.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.158.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.158.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.158.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.158.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.159.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.159.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.159.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.159.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.159.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.159.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.16.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.16.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.16.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.16.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.16.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.16.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.17.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.17.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.17.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.17.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.17.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.17.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.18.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.18.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.18.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.18.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.18.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.18.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.19.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.19.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.19.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.19.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.19.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.19.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.2.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.2.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.2.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.2.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.2.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.2.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.20.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.20.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.20.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.20.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.20.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.20.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.21.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.21.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.21.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.21.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.21.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.21.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.22.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.22.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.22.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.22.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.22.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.22.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.23.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.23.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.23.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.23.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.23.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.23.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.24.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.24.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.24.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.24.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.24.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.24.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.25.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.25.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.25.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.25.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.25.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.25.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.26.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.26.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.26.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.26.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.26.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.26.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.27.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.27.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.27.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.27.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.27.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.27.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.28.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.28.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.28.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.28.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.28.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.28.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.29.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.29.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.29.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.29.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.29.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.29.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.3.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.3.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.3.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.3.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.3.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.3.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.30.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.30.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.30.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.30.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.30.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.30.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.31.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.31.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.31.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.31.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.31.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.31.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.32.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.32.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.32.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.32.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.32.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.32.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.33.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.33.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.33.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.33.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.33.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.33.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.34.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.34.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.34.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.34.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.34.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.34.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.35.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.35.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.35.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.35.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.35.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.35.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.36.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.36.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.36.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.36.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.36.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.36.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.37.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.37.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.37.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.37.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.37.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.37.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.38.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.38.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.38.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.38.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.38.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.38.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.39.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.39.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.39.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.39.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.39.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.39.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.4.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.4.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.4.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.4.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.4.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.4.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.40.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.40.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.40.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.40.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.40.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.40.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.41.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.41.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.41.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.41.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.41.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.41.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.42.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.42.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.42.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.42.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.42.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.42.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.43.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.43.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.43.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.43.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.43.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.43.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.44.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.44.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.44.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.44.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.44.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.44.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.45.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.45.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.45.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.45.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.45.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.45.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.46.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.46.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.46.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.46.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.46.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.46.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.47.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.47.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.47.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.47.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.47.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.47.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.48.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.48.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.48.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.48.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.48.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.48.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.49.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.49.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.49.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.49.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.49.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.49.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.5.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.5.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.5.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.5.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.5.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.5.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.50.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.50.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.50.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.50.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.50.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.50.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.51.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.51.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.51.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.51.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.51.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.51.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.52.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.52.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.52.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.52.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.52.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.52.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.53.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.53.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.53.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.53.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.53.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.53.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.54.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.54.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.54.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.54.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.54.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.54.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.55.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.55.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.55.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.55.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.55.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.55.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.56.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.56.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.56.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.56.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.56.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.56.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.57.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.57.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.57.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.57.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.57.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.57.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.58.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.58.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.58.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.58.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.58.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.58.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.59.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.59.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.59.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.59.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.59.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.59.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.6.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.6.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.6.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.6.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.6.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.6.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.60.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.60.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.60.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.60.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.60.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.60.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.61.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.61.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.61.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.61.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.61.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.61.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.62.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.62.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.62.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.62.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.62.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.62.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.63.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.63.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.63.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.63.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.63.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.63.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.64.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.64.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.64.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.64.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.64.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.64.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.65.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.65.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.65.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.65.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.65.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.65.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.66.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.66.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.66.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.66.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.66.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.66.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.67.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.67.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.67.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.67.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.67.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.67.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.68.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.68.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.68.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.68.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.68.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.68.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.69.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.69.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.69.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.69.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.69.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.69.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.7.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.7.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.7.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.7.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.7.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.7.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.70.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.70.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.70.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.70.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.70.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.70.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.71.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.71.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.71.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.71.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.71.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.71.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.72.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.72.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.72.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.72.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.72.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.72.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.73.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.73.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.73.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.73.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.73.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.73.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.74.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.74.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.74.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.74.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.74.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.74.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.75.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.75.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.75.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.75.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.75.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.75.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.76.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.76.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.76.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.76.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.76.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.76.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.77.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.77.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.77.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.77.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.77.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.77.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.78.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.78.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.78.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.78.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.78.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.78.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.79.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.79.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.79.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.79.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.79.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.79.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.8.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.8.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.8.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.8.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.8.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.8.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.80.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.80.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.80.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.80.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.80.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.80.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.81.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.81.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.81.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.81.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.81.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.81.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.82.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.82.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.82.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.82.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.82.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.82.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.83.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.83.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.83.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.83.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.83.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.83.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.84.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.84.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.84.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.84.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.84.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.84.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.85.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.85.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.85.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.85.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.85.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.85.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.86.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.86.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.86.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.86.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.86.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.86.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.87.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.87.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.87.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.87.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.87.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.87.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.88.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.88.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.88.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.88.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.88.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.88.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.89.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.89.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.89.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.89.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.89.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.89.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.9.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.9.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.9.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.9.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.9.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.9.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.90.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.90.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.90.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.90.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.90.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.90.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.91.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.91.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.91.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.91.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.91.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.91.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.92.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.92.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.92.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.92.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.92.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.92.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.93.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.93.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.93.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.93.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.93.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.93.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.94.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.94.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.94.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.94.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.94.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.94.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.95.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.95.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.95.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.95.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.95.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.95.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.96.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.96.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.96.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.96.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.96.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.96.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.97.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.97.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.97.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.97.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.97.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.97.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.98.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.98.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.98.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.98.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.98.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.98.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.99.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.99.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.99.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.99.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.99.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.experts.99.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.gate.e_score_correction_bias": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.gate.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.shared_experts.down_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.shared_experts.down_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.shared_experts.gate_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.shared_experts.gate_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.shared_experts.up_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.mlp.shared_experts.up_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.post_attention_layernorm.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.self_attn.k_norm.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.self_attn.k_proj.bias": "model-00085-of-00092.safetensors",
+ "model.layers.84.self_attn.k_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.self_attn.k_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.self_attn.o_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.self_attn.o_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.self_attn.q_norm.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.self_attn.q_proj.bias": "model-00085-of-00092.safetensors",
+ "model.layers.84.self_attn.q_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.self_attn.q_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.84.self_attn.v_proj.bias": "model-00085-of-00092.safetensors",
+ "model.layers.84.self_attn.v_proj.weight": "model-00085-of-00092.safetensors",
+ "model.layers.84.self_attn.v_proj.weight_scale": "model-00085-of-00092.safetensors",
+ "model.layers.85.input_layernorm.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.0.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.0.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.0.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.0.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.0.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.0.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.1.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.1.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.1.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.1.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.1.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.1.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.10.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.10.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.10.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.10.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.10.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.10.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.100.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.100.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.100.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.100.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.100.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.100.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.101.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.101.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.101.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.101.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.101.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.101.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.102.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.102.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.102.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.102.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.102.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.102.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.103.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.103.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.103.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.103.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.103.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.103.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.104.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.104.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.104.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.104.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.104.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.104.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.105.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.105.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.105.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.105.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.105.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.105.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.106.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.106.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.106.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.106.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.106.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.106.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.107.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.107.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.107.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.107.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.107.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.107.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.108.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.108.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.108.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.108.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.108.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.108.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.109.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.109.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.109.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.109.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.109.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.109.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.11.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.11.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.11.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.11.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.11.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.11.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.110.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.110.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.110.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.110.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.110.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.110.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.111.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.111.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.111.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.111.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.111.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.111.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.112.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.112.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.112.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.112.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.112.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.112.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.113.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.113.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.113.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.113.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.113.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.113.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.114.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.114.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.114.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.114.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.114.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.114.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.115.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.115.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.115.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.115.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.115.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.115.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.116.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.116.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.116.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.116.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.116.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.116.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.117.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.117.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.117.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.117.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.117.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.117.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.118.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.118.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.118.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.118.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.118.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.118.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.119.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.119.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.119.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.119.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.119.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.119.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.12.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.12.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.12.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.12.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.12.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.12.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.120.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.120.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.120.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.120.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.120.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.120.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.121.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.121.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.121.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.121.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.121.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.121.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.122.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.122.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.122.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.122.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.122.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.122.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.123.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.123.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.123.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.123.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.123.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.123.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.124.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.124.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.124.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.124.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.124.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.124.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.125.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.125.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.125.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.125.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.125.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.125.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.126.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.126.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.126.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.126.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.126.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.126.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.127.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.127.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.127.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.127.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.127.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.127.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.128.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.128.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.128.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.128.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.128.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.128.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.129.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.129.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.129.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.129.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.129.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.129.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.13.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.13.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.13.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.13.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.13.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.13.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.130.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.130.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.130.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.130.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.130.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.130.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.131.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.131.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.131.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.131.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.131.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.131.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.132.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.132.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.132.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.132.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.132.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.132.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.133.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.133.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.133.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.133.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.133.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.133.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.134.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.134.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.134.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.134.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.134.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.134.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.135.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.135.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.135.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.135.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.135.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.135.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.136.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.136.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.136.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.136.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.136.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.136.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.137.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.137.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.137.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.137.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.137.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.137.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.138.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.138.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.138.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.138.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.138.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.138.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.139.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.139.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.139.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.139.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.139.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.139.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.14.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.14.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.14.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.14.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.14.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.14.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.140.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.140.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.140.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.140.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.140.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.140.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.141.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.141.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.141.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.141.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.141.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.141.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.142.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.142.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.142.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.142.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.142.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.142.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.143.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.143.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.143.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.143.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.143.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.143.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.144.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.144.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.144.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.144.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.144.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.144.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.145.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.145.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.145.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.145.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.145.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.145.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.146.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.146.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.146.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.146.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.146.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.146.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.147.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.147.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.147.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.147.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.147.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.147.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.148.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.148.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.148.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.148.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.148.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.148.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.149.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.149.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.149.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.149.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.149.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.149.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.15.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.15.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.15.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.15.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.15.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.15.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.150.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.150.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.150.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.150.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.150.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.150.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.151.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.151.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.151.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.151.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.151.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.151.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.152.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.152.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.152.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.152.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.152.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.152.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.153.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.153.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.153.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.153.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.153.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.153.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.154.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.154.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.154.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.154.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.154.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.154.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.155.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.155.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.155.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.155.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.155.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.155.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.156.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.156.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.156.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.156.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.156.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.156.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.157.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.157.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.157.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.157.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.157.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.157.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.158.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.158.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.158.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.158.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.158.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.158.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.159.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.159.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.159.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.159.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.159.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.159.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.16.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.16.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.16.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.16.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.16.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.16.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.17.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.17.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.17.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.17.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.17.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.17.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.18.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.18.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.18.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.18.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.18.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.18.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.19.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.19.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.19.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.19.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.19.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.19.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.2.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.2.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.2.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.2.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.2.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.2.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.20.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.20.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.20.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.20.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.20.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.20.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.21.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.21.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.21.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.21.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.21.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.21.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.22.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.22.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.22.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.22.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.22.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.22.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.23.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.23.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.23.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.23.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.23.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.23.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.24.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.24.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.24.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.24.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.24.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.24.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.25.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.25.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.25.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.25.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.25.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.25.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.26.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.26.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.26.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.26.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.26.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.26.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.27.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.27.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.27.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.27.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.27.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.27.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.28.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.28.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.28.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.28.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.28.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.28.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.29.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.29.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.29.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.29.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.29.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.29.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.3.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.3.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.3.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.3.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.3.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.3.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.30.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.30.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.30.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.30.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.30.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.30.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.31.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.31.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.31.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.31.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.31.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.31.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.32.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.32.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.32.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.32.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.32.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.32.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.33.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.33.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.33.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.33.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.33.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.33.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.34.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.34.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.34.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.34.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.34.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.34.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.35.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.35.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.35.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.35.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.35.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.35.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.36.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.36.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.36.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.36.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.36.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.36.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.37.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.37.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.37.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.37.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.37.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.37.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.38.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.38.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.38.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.38.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.38.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.38.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.39.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.39.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.39.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.39.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.39.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.39.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.4.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.4.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.4.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.4.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.4.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.4.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.40.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.40.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.40.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.40.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.40.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.40.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.41.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.41.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.41.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.41.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.41.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.41.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.42.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.42.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.42.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.42.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.42.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.42.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.43.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.43.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.43.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.43.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.43.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.43.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.44.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.44.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.44.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.44.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.44.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.44.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.45.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.45.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.45.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.45.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.45.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.45.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.46.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.46.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.46.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.46.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.46.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.46.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.47.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.47.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.47.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.47.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.47.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.47.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.48.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.48.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.48.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.48.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.48.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.48.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.49.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.49.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.49.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.49.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.49.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.49.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.5.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.5.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.5.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.5.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.5.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.5.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.50.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.50.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.50.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.50.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.50.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.50.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.51.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.51.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.51.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.51.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.51.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.51.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.52.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.52.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.52.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.52.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.52.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.52.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.53.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.53.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.53.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.53.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.53.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.53.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.54.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.54.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.54.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.54.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.54.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.54.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.55.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.55.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.55.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.55.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.55.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.55.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.56.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.56.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.56.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.56.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.56.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.56.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.57.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.57.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.57.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.57.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.57.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.57.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.58.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.58.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.58.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.58.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.58.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.58.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.59.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.59.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.59.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.59.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.59.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.59.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.6.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.6.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.6.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.6.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.6.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.6.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.60.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.60.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.60.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.60.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.60.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.60.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.61.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.61.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.61.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.61.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.61.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.61.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.62.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.62.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.62.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.62.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.62.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.62.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.63.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.63.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.63.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.63.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.63.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.63.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.64.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.64.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.64.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.64.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.64.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.64.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.65.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.65.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.65.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.65.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.65.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.65.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.66.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.66.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.66.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.66.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.66.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.66.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.67.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.67.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.67.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.67.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.67.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.67.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.68.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.68.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.68.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.68.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.68.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.68.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.69.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.69.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.69.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.69.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.69.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.69.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.7.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.7.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.7.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.7.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.7.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.7.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.70.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.70.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.70.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.70.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.70.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.70.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.71.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.71.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.71.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.71.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.71.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.71.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.72.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.72.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.72.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.72.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.72.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.72.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.73.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.73.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.73.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.73.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.73.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.73.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.74.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.74.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.74.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.74.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.74.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.74.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.75.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.75.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.75.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.75.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.75.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.75.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.76.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.76.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.76.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.76.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.76.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.76.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.77.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.77.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.77.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.77.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.77.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.77.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.78.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.78.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.78.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.78.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.78.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.78.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.79.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.79.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.79.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.79.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.79.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.79.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.8.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.8.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.8.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.8.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.8.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.8.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.80.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.80.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.80.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.80.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.80.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.80.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.81.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.81.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.81.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.81.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.81.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.81.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.82.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.82.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.82.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.82.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.82.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.82.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.83.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.83.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.83.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.83.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.83.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.83.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.84.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.84.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.84.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.84.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.84.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.84.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.85.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.85.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.85.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.85.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.85.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.85.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.86.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.86.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.86.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.86.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.86.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.86.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.87.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.87.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.87.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.87.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.87.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.87.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.88.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.88.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.88.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.88.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.88.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.88.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.89.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.89.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.89.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.89.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.89.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.89.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.9.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.9.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.9.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.9.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.9.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.9.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.90.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.90.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.90.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.90.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.90.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.90.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.91.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.91.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.91.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.91.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.91.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.91.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.92.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.92.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.92.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.92.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.92.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.92.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.93.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.93.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.93.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.93.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.93.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.93.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.94.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.94.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.94.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.94.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.94.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.94.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.95.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.95.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.95.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.95.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.95.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.95.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.96.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.96.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.96.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.96.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.96.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.96.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.97.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.97.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.97.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.97.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.97.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.97.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.98.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.98.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.98.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.98.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.98.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.98.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.99.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.99.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.99.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.99.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.99.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.experts.99.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.gate.e_score_correction_bias": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.gate.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.shared_experts.down_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.shared_experts.down_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.shared_experts.gate_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.shared_experts.gate_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.shared_experts.up_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.mlp.shared_experts.up_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.post_attention_layernorm.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.self_attn.k_norm.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.self_attn.k_proj.bias": "model-00086-of-00092.safetensors",
+ "model.layers.85.self_attn.k_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.self_attn.k_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.self_attn.o_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.self_attn.o_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.self_attn.q_norm.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.self_attn.q_proj.bias": "model-00086-of-00092.safetensors",
+ "model.layers.85.self_attn.q_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.self_attn.q_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.85.self_attn.v_proj.bias": "model-00086-of-00092.safetensors",
+ "model.layers.85.self_attn.v_proj.weight": "model-00086-of-00092.safetensors",
+ "model.layers.85.self_attn.v_proj.weight_scale": "model-00086-of-00092.safetensors",
+ "model.layers.86.input_layernorm.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.0.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.0.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.0.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.0.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.0.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.0.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.1.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.1.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.1.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.1.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.1.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.1.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.10.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.10.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.10.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.10.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.10.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.10.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.100.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.100.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.100.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.100.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.100.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.100.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.101.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.101.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.101.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.101.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.101.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.101.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.102.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.102.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.102.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.102.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.102.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.102.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.103.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.103.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.103.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.103.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.103.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.103.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.104.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.104.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.104.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.104.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.104.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.104.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.105.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.105.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.105.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.105.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.105.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.105.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.106.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.106.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.106.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.106.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.106.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.106.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.107.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.107.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.107.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.107.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.107.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.107.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.108.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.108.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.108.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.108.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.108.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.108.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.109.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.109.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.109.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.109.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.109.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.109.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.11.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.11.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.11.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.11.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.11.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.11.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.110.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.110.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.110.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.110.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.110.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.110.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.111.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.111.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.111.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.111.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.111.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.111.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.112.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.112.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.112.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.112.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.112.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.112.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.113.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.113.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.113.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.113.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.113.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.113.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.114.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.114.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.114.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.114.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.114.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.114.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.115.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.115.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.115.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.115.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.115.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.115.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.116.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.116.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.116.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.116.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.116.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.116.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.117.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.117.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.117.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.117.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.117.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.117.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.118.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.118.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.118.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.118.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.118.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.118.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.119.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.119.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.119.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.119.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.119.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.119.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.12.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.12.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.12.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.12.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.12.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.12.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.120.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.120.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.120.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.120.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.120.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.120.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.121.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.121.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.121.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.121.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.121.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.121.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.122.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.122.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.122.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.122.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.122.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.122.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.123.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.123.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.123.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.123.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.123.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.123.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.124.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.124.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.124.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.124.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.124.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.124.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.125.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.125.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.125.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.125.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.125.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.125.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.126.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.126.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.126.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.126.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.126.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.126.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.127.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.127.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.127.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.127.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.127.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.127.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.128.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.128.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.128.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.128.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.128.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.128.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.129.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.129.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.129.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.129.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.129.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.129.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.13.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.13.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.13.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.13.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.13.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.13.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.130.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.130.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.130.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.130.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.130.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.130.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.131.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.131.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.131.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.131.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.131.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.131.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.132.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.132.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.132.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.132.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.132.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.132.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.133.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.133.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.133.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.133.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.133.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.133.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.134.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.134.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.134.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.134.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.134.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.134.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.135.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.135.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.135.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.135.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.135.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.135.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.136.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.136.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.136.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.136.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.136.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.136.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.137.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.137.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.137.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.137.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.137.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.137.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.138.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.138.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.138.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.138.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.138.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.138.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.139.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.139.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.139.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.139.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.139.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.139.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.14.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.14.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.14.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.14.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.14.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.14.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.140.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.140.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.140.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.140.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.140.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.140.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.141.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.141.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.141.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.141.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.141.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.141.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.142.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.142.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.142.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.142.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.142.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.142.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.143.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.143.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.143.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.143.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.143.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.143.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.144.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.144.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.144.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.144.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.144.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.144.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.145.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.145.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.145.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.145.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.145.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.145.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.146.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.146.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.146.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.146.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.146.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.146.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.147.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.147.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.147.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.147.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.147.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.147.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.148.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.148.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.148.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.148.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.148.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.148.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.149.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.149.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.149.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.149.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.149.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.149.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.15.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.15.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.15.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.15.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.15.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.15.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.150.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.150.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.150.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.150.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.150.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.150.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.151.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.151.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.151.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.151.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.151.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.151.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.152.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.152.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.152.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.152.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.152.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.152.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.153.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.153.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.153.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.153.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.153.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.153.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.154.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.154.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.154.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.154.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.154.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.154.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.155.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.155.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.155.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.155.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.155.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.155.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.156.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.156.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.156.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.156.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.156.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.156.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.157.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.157.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.157.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.157.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.157.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.157.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.158.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.158.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.158.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.158.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.158.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.158.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.159.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.159.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.159.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.159.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.159.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.159.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.16.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.16.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.16.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.16.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.16.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.16.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.17.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.17.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.17.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.17.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.17.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.17.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.18.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.18.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.18.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.18.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.18.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.18.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.19.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.19.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.19.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.19.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.19.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.19.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.2.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.2.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.2.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.2.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.2.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.2.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.20.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.20.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.20.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.20.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.20.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.20.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.21.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.21.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.21.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.21.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.21.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.21.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.22.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.22.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.22.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.22.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.22.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.22.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.23.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.23.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.23.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.23.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.23.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.23.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.24.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.24.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.24.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.24.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.24.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.24.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.25.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.25.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.25.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.25.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.25.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.25.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.26.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.26.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.26.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.26.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.26.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.26.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.27.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.27.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.27.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.27.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.27.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.27.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.28.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.28.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.28.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.28.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.28.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.28.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.29.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.29.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.29.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.29.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.29.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.29.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.3.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.3.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.3.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.3.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.3.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.3.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.30.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.30.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.30.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.30.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.30.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.30.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.31.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.31.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.31.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.31.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.31.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.31.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.32.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.32.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.32.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.32.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.32.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.32.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.33.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.33.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.33.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.33.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.33.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.33.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.34.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.34.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.34.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.34.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.34.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.34.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.35.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.35.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.35.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.35.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.35.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.35.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.36.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.36.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.36.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.36.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.36.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.36.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.37.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.37.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.37.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.37.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.37.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.37.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.38.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.38.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.38.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.38.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.38.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.38.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.39.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.39.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.39.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.39.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.39.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.39.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.4.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.4.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.4.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.4.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.4.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.4.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.40.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.40.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.40.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.40.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.40.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.40.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.41.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.41.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.41.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.41.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.41.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.41.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.42.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.42.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.42.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.42.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.42.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.42.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.43.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.43.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.43.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.43.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.43.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.43.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.44.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.44.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.44.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.44.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.44.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.44.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.45.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.45.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.45.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.45.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.45.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.45.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.46.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.46.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.46.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.46.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.46.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.46.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.47.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.47.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.47.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.47.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.47.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.47.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.48.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.48.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.48.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.48.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.48.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.48.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.49.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.49.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.49.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.49.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.49.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.49.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.5.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.5.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.5.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.5.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.5.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.5.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.50.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.50.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.50.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.50.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.50.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.50.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.51.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.51.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.51.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.51.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.51.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.51.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.52.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.52.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.52.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.52.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.52.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.52.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.53.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.53.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.53.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.53.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.53.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.53.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.54.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.54.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.54.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.54.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.54.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.54.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.55.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.55.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.55.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.55.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.55.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.55.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.56.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.56.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.56.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.56.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.56.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.56.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.57.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.57.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.57.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.57.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.57.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.57.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.58.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.58.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.58.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.58.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.58.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.58.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.59.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.59.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.59.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.59.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.59.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.59.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.6.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.6.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.6.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.6.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.6.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.6.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.60.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.60.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.60.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.60.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.60.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.60.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.61.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.61.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.61.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.61.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.61.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.61.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.62.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.62.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.62.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.62.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.62.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.62.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.63.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.63.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.63.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.63.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.63.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.63.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.64.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.64.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.64.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.64.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.64.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.64.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.65.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.65.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.65.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.65.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.65.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.65.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.66.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.66.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.66.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.66.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.66.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.66.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.67.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.67.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.67.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.67.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.67.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.67.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.68.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.68.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.68.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.68.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.68.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.68.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.69.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.69.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.69.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.69.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.69.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.69.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.7.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.7.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.7.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.7.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.7.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.7.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.70.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.70.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.70.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.70.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.70.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.70.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.71.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.71.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.71.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.71.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.71.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.71.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.72.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.72.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.72.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.72.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.72.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.72.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.73.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.73.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.73.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.73.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.73.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.73.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.74.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.74.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.74.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.74.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.74.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.74.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.75.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.75.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.75.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.75.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.75.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.75.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.76.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.76.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.76.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.76.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.76.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.76.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.77.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.77.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.77.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.77.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.77.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.77.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.78.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.78.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.78.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.78.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.78.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.78.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.79.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.79.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.79.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.79.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.79.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.79.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.8.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.8.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.8.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.8.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.8.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.8.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.80.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.80.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.80.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.80.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.80.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.80.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.81.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.81.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.81.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.81.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.81.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.81.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.82.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.82.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.82.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.82.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.82.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.82.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.83.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.83.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.83.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.83.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.83.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.83.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.84.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.84.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.84.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.84.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.84.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.84.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.85.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.85.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.85.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.85.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.85.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.85.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.86.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.86.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.86.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.86.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.86.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.86.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.87.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.87.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.87.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.87.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.87.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.87.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.88.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.88.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.88.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.88.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.88.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.88.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.89.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.89.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.89.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.89.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.89.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.89.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.9.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.9.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.9.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.9.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.9.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.9.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.90.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.90.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.90.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.90.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.90.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.90.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.91.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.91.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.91.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.91.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.91.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.91.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.92.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.92.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.92.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.92.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.92.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.92.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.93.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.93.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.93.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.93.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.93.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.93.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.94.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.94.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.94.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.94.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.94.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.94.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.95.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.95.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.95.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.95.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.95.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.95.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.96.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.96.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.96.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.96.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.96.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.96.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.97.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.97.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.97.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.97.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.97.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.97.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.98.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.98.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.98.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.98.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.98.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.98.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.99.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.99.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.99.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.99.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.99.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.experts.99.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.gate.e_score_correction_bias": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.gate.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.shared_experts.down_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.shared_experts.down_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.shared_experts.gate_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.shared_experts.gate_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.shared_experts.up_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.mlp.shared_experts.up_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.post_attention_layernorm.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.self_attn.k_norm.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.self_attn.k_proj.bias": "model-00087-of-00092.safetensors",
+ "model.layers.86.self_attn.k_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.self_attn.k_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.self_attn.o_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.self_attn.o_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.self_attn.q_norm.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.self_attn.q_proj.bias": "model-00087-of-00092.safetensors",
+ "model.layers.86.self_attn.q_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.self_attn.q_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.86.self_attn.v_proj.bias": "model-00087-of-00092.safetensors",
+ "model.layers.86.self_attn.v_proj.weight": "model-00087-of-00092.safetensors",
+ "model.layers.86.self_attn.v_proj.weight_scale": "model-00087-of-00092.safetensors",
+ "model.layers.87.input_layernorm.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.0.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.0.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.0.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.0.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.0.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.0.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.1.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.1.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.1.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.1.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.1.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.1.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.10.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.10.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.10.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.10.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.10.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.10.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.100.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.100.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.100.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.100.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.100.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.100.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.101.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.101.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.101.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.101.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.101.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.101.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.102.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.102.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.102.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.102.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.102.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.102.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.103.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.103.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.103.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.103.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.103.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.103.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.104.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.104.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.104.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.104.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.104.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.104.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.105.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.105.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.105.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.105.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.105.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.105.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.106.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.106.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.106.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.106.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.106.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.106.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.107.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.107.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.107.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.107.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.107.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.107.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.108.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.108.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.108.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.108.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.108.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.108.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.109.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.109.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.109.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.109.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.109.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.109.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.11.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.11.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.11.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.11.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.11.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.11.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.110.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.110.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.110.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.110.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.110.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.110.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.111.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.111.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.111.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.111.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.111.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.111.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.112.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.112.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.112.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.112.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.112.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.112.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.113.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.113.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.113.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.113.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.113.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.113.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.114.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.114.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.114.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.114.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.114.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.114.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.115.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.115.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.115.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.115.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.115.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.115.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.116.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.116.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.116.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.116.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.116.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.116.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.117.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.117.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.117.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.117.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.117.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.117.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.118.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.118.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.118.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.118.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.118.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.118.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.119.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.119.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.119.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.119.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.119.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.119.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.12.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.12.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.12.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.12.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.12.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.12.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.120.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.120.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.120.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.120.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.120.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.120.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.121.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.121.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.121.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.121.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.121.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.121.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.122.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.122.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.122.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.122.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.122.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.122.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.123.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.123.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.123.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.123.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.123.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.123.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.124.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.124.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.124.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.124.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.124.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.124.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.125.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.125.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.125.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.125.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.125.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.125.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.126.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.126.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.126.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.126.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.126.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.126.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.127.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.127.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.127.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.127.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.127.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.127.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.128.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.128.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.128.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.128.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.128.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.128.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.129.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.129.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.129.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.129.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.129.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.129.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.13.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.13.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.13.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.13.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.13.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.13.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.130.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.130.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.130.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.130.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.130.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.130.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.131.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.131.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.131.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.131.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.131.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.131.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.132.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.132.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.132.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.132.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.132.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.132.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.133.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.133.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.133.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.133.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.133.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.133.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.134.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.134.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.134.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.134.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.134.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.134.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.135.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.135.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.135.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.135.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.135.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.135.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.136.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.136.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.136.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.136.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.136.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.136.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.137.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.137.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.137.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.137.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.137.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.137.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.138.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.138.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.138.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.138.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.138.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.138.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.139.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.139.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.139.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.139.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.139.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.139.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.14.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.14.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.14.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.14.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.14.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.14.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.140.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.140.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.140.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.140.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.140.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.140.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.141.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.141.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.141.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.141.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.141.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.141.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.142.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.142.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.142.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.142.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.142.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.142.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.143.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.143.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.143.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.143.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.143.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.143.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.144.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.144.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.144.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.144.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.144.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.144.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.145.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.145.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.145.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.145.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.145.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.145.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.146.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.146.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.146.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.146.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.146.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.146.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.147.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.147.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.147.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.147.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.147.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.147.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.148.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.148.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.148.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.148.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.148.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.148.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.149.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.149.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.149.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.149.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.149.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.149.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.15.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.15.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.15.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.15.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.15.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.15.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.150.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.150.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.150.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.150.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.150.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.150.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.151.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.151.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.151.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.151.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.151.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.151.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.152.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.152.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.152.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.152.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.152.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.152.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.153.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.153.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.153.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.153.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.153.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.153.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.154.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.154.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.154.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.154.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.154.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.154.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.155.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.155.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.155.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.155.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.155.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.155.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.156.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.156.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.156.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.156.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.156.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.156.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.157.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.157.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.157.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.157.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.157.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.157.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.158.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.158.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.158.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.158.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.158.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.158.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.159.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.159.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.159.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.159.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.159.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.159.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.16.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.16.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.16.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.16.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.16.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.16.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.17.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.17.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.17.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.17.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.17.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.17.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.18.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.18.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.18.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.18.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.18.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.18.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.19.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.19.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.19.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.19.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.19.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.19.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.2.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.2.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.2.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.2.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.2.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.2.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.20.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.20.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.20.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.20.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.20.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.20.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.21.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.21.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.21.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.21.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.21.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.21.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.22.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.22.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.22.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.22.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.22.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.22.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.23.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.23.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.23.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.23.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.23.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.23.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.24.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.24.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.24.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.24.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.24.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.24.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.25.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.25.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.25.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.25.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.25.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.25.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.26.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.26.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.26.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.26.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.26.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.26.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.27.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.27.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.27.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.27.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.27.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.27.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.28.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.28.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.28.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.28.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.28.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.28.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.29.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.29.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.29.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.29.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.29.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.29.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.3.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.3.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.3.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.3.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.3.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.3.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.30.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.30.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.30.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.30.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.30.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.30.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.31.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.31.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.31.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.31.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.31.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.31.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.32.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.32.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.32.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.32.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.32.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.32.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.33.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.33.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.33.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.33.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.33.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.33.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.34.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.34.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.34.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.34.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.34.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.34.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.35.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.35.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.35.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.35.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.35.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.35.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.36.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.36.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.36.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.36.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.36.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.36.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.37.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.37.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.37.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.37.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.37.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.37.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.38.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.38.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.38.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.38.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.38.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.38.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.39.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.39.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.39.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.39.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.39.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.39.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.4.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.4.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.4.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.4.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.4.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.4.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.40.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.40.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.40.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.40.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.40.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.40.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.41.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.41.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.41.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.41.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.41.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.41.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.42.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.42.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.42.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.42.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.42.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.42.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.43.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.43.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.43.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.43.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.43.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.43.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.44.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.44.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.44.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.44.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.44.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.44.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.45.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.45.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.45.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.45.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.45.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.45.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.46.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.46.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.46.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.46.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.46.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.46.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.47.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.47.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.47.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.47.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.47.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.47.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.48.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.48.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.48.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.48.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.48.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.48.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.49.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.49.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.49.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.49.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.49.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.49.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.5.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.5.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.5.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.5.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.5.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.5.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.50.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.50.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.50.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.50.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.50.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.50.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.51.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.51.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.51.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.51.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.51.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.51.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.52.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.52.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.52.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.52.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.52.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.52.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.53.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.53.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.53.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.53.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.53.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.53.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.54.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.54.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.54.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.54.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.54.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.54.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.55.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.55.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.55.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.55.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.55.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.55.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.56.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.56.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.56.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.56.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.56.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.56.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.57.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.57.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.57.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.57.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.57.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.57.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.58.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.58.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.58.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.58.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.58.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.58.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.59.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.59.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.59.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.59.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.59.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.59.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.6.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.6.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.6.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.6.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.6.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.6.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.60.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.60.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.60.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.60.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.60.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.60.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.61.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.61.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.61.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.61.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.61.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.61.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.62.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.62.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.62.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.62.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.62.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.62.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.63.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.63.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.63.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.63.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.63.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.63.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.64.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.64.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.64.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.64.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.64.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.64.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.65.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.65.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.65.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.65.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.65.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.65.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.66.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.66.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.66.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.66.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.66.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.66.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.67.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.67.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.67.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.67.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.67.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.67.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.68.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.68.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.68.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.68.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.68.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.68.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.69.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.69.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.69.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.69.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.69.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.69.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.7.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.7.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.7.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.7.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.7.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.7.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.70.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.70.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.70.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.70.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.70.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.70.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.71.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.71.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.71.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.71.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.71.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.71.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.72.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.72.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.72.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.72.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.72.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.72.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.73.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.73.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.73.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.73.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.73.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.73.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.74.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.74.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.74.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.74.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.74.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.74.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.75.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.75.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.75.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.75.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.75.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.75.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.76.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.76.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.76.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.76.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.76.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.76.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.77.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.77.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.77.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.77.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.77.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.77.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.78.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.78.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.78.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.78.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.78.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.78.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.79.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.79.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.79.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.79.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.79.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.79.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.8.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.8.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.8.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.8.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.8.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.8.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.80.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.80.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.80.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.80.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.80.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.80.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.81.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.81.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.81.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.81.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.81.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.81.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.82.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.82.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.82.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.82.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.82.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.82.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.83.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.83.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.83.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.83.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.83.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.83.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.84.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.84.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.84.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.84.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.84.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.84.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.85.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.85.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.85.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.85.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.85.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.85.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.86.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.86.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.86.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.86.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.86.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.86.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.87.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.87.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.87.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.87.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.87.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.87.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.88.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.88.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.88.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.88.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.88.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.88.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.89.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.89.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.89.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.89.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.89.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.89.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.9.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.9.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.9.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.9.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.9.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.9.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.90.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.90.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.90.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.90.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.90.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.90.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.91.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.91.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.91.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.91.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.91.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.91.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.92.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.92.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.92.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.92.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.92.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.92.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.93.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.93.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.93.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.93.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.93.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.93.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.94.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.94.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.94.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.94.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.94.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.94.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.95.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.95.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.95.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.95.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.95.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.95.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.96.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.96.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.96.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.96.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.96.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.96.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.97.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.97.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.97.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.97.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.97.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.97.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.98.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.98.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.98.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.98.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.98.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.98.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.99.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.99.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.99.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.99.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.99.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.experts.99.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.gate.e_score_correction_bias": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.gate.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.shared_experts.down_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.shared_experts.down_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.shared_experts.gate_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.shared_experts.gate_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.shared_experts.up_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.mlp.shared_experts.up_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.post_attention_layernorm.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.self_attn.k_norm.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.self_attn.k_proj.bias": "model-00088-of-00092.safetensors",
+ "model.layers.87.self_attn.k_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.self_attn.k_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.self_attn.o_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.self_attn.o_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.self_attn.q_norm.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.self_attn.q_proj.bias": "model-00088-of-00092.safetensors",
+ "model.layers.87.self_attn.q_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.self_attn.q_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.87.self_attn.v_proj.bias": "model-00088-of-00092.safetensors",
+ "model.layers.87.self_attn.v_proj.weight": "model-00088-of-00092.safetensors",
+ "model.layers.87.self_attn.v_proj.weight_scale": "model-00088-of-00092.safetensors",
+ "model.layers.88.input_layernorm.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.0.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.0.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.0.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.0.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.0.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.0.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.1.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.1.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.1.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.1.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.1.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.1.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.10.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.10.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.10.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.10.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.10.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.10.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.100.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.100.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.100.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.100.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.100.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.100.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.101.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.101.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.101.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.101.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.101.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.101.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.102.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.102.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.102.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.102.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.102.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.102.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.103.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.103.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.103.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.103.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.103.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.103.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.104.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.104.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.104.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.104.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.104.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.104.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.105.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.105.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.105.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.105.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.105.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.105.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.106.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.106.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.106.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.106.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.106.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.106.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.107.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.107.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.107.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.107.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.107.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.107.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.108.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.108.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.108.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.108.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.108.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.108.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.109.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.109.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.109.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.109.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.109.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.109.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.11.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.11.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.11.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.11.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.11.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.11.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.110.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.110.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.110.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.110.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.110.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.110.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.111.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.111.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.111.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.111.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.111.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.111.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.112.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.112.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.112.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.112.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.112.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.112.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.113.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.113.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.113.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.113.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.113.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.113.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.114.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.114.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.114.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.114.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.114.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.114.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.115.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.115.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.115.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.115.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.115.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.115.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.116.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.116.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.116.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.116.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.116.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.116.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.117.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.117.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.117.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.117.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.117.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.117.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.118.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.118.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.118.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.118.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.118.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.118.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.119.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.119.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.119.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.119.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.119.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.119.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.12.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.12.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.12.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.12.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.12.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.12.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.120.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.120.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.120.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.120.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.120.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.120.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.121.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.121.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.121.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.121.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.121.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.121.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.122.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.122.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.122.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.122.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.122.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.122.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.123.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.123.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.123.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.123.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.123.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.123.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.124.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.124.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.124.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.124.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.124.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.124.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.125.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.125.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.125.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.125.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.125.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.125.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.126.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.126.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.126.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.126.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.126.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.126.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.127.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.127.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.127.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.127.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.127.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.127.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.128.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.128.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.128.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.128.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.128.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.128.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.129.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.129.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.129.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.129.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.129.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.129.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.13.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.13.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.13.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.13.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.13.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.13.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.130.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.130.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.130.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.130.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.130.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.130.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.131.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.131.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.131.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.131.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.131.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.131.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.132.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.132.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.132.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.132.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.132.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.132.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.133.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.133.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.133.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.133.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.133.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.133.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.134.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.134.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.134.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.134.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.134.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.134.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.135.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.135.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.135.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.135.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.135.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.135.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.136.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.136.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.136.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.136.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.136.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.136.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.137.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.137.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.137.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.137.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.137.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.137.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.138.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.138.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.138.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.138.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.138.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.138.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.139.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.139.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.139.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.139.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.139.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.139.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.14.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.14.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.14.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.14.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.14.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.14.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.140.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.140.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.140.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.140.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.140.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.140.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.141.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.141.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.141.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.141.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.141.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.141.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.142.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.142.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.142.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.142.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.142.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.142.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.143.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.143.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.143.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.143.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.143.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.143.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.144.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.144.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.144.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.144.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.144.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.144.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.145.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.145.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.145.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.145.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.145.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.145.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.146.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.146.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.146.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.146.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.146.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.146.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.147.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.147.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.147.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.147.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.147.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.147.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.148.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.148.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.148.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.148.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.148.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.148.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.149.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.149.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.149.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.149.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.149.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.149.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.15.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.15.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.15.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.15.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.15.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.15.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.150.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.150.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.150.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.150.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.150.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.150.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.151.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.151.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.151.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.151.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.151.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.151.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.152.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.152.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.152.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.152.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.152.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.152.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.153.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.153.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.153.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.153.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.153.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.153.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.154.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.154.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.154.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.154.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.154.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.154.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.155.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.155.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.155.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.155.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.155.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.155.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.156.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.156.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.156.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.156.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.156.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.156.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.157.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.157.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.157.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.157.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.157.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.157.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.158.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.158.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.158.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.158.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.158.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.158.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.159.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.159.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.159.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.159.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.159.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.159.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.16.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.16.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.16.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.16.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.16.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.16.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.17.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.17.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.17.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.17.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.17.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.17.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.18.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.18.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.18.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.18.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.18.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.18.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.19.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.19.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.19.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.19.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.19.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.19.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.2.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.2.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.2.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.2.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.2.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.2.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.20.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.20.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.20.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.20.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.20.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.20.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.21.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.21.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.21.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.21.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.21.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.21.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.22.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.22.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.22.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.22.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.22.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.22.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.23.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.23.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.23.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.23.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.23.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.23.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.24.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.24.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.24.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.24.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.24.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.24.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.25.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.25.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.25.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.25.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.25.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.25.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.26.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.26.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.26.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.26.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.26.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.26.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.27.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.27.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.27.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.27.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.27.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.27.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.28.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.28.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.28.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.28.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.28.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.28.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.29.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.29.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.29.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.29.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.29.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.29.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.3.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.3.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.3.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.3.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.3.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.3.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.30.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.30.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.30.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.30.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.30.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.30.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.31.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.31.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.31.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.31.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.31.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.31.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.32.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.32.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.32.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.32.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.32.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.32.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.33.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.33.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.33.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.33.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.33.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.33.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.34.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.34.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.34.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.34.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.34.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.34.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.35.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.35.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.35.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.35.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.35.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.35.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.36.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.36.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.36.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.36.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.36.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.36.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.37.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.37.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.37.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.37.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.37.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.37.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.38.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.38.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.38.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.38.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.38.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.38.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.39.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.39.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.39.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.39.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.39.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.39.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.4.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.4.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.4.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.4.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.4.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.4.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.40.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.40.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.40.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.40.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.40.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.40.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.41.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.41.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.41.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.41.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.41.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.41.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.42.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.42.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.42.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.42.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.42.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.42.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.43.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.43.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.43.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.43.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.43.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.43.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.44.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.44.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.44.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.44.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.44.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.44.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.45.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.45.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.45.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.45.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.45.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.45.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.46.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.46.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.46.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.46.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.46.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.46.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.47.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.47.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.47.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.47.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.47.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.47.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.48.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.48.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.48.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.48.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.48.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.48.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.49.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.49.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.49.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.49.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.49.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.49.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.5.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.5.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.5.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.5.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.5.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.5.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.50.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.50.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.50.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.50.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.50.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.50.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.51.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.51.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.51.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.51.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.51.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.51.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.52.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.52.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.52.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.52.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.52.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.52.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.53.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.53.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.53.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.53.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.53.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.53.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.54.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.54.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.54.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.54.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.54.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.54.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.55.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.55.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.55.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.55.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.55.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.55.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.56.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.56.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.56.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.56.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.56.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.56.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.57.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.57.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.57.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.57.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.57.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.57.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.58.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.58.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.58.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.58.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.58.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.58.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.59.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.59.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.59.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.59.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.59.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.59.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.6.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.6.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.6.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.6.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.6.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.6.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.60.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.60.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.60.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.60.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.60.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.60.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.61.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.61.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.61.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.61.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.61.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.61.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.62.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.62.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.62.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.62.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.62.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.62.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.63.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.63.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.63.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.63.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.63.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.63.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.64.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.64.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.64.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.64.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.64.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.64.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.65.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.65.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.65.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.65.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.65.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.65.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.66.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.66.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.66.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.66.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.66.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.66.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.67.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.67.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.67.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.67.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.67.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.67.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.68.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.68.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.68.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.68.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.68.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.68.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.69.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.69.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.69.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.69.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.69.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.69.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.7.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.7.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.7.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.7.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.7.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.7.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.70.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.70.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.70.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.70.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.70.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.70.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.71.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.71.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.71.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.71.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.71.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.71.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.72.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.72.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.72.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.72.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.72.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.72.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.73.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.73.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.73.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.73.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.73.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.73.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.74.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.74.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.74.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.74.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.74.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.74.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.75.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.75.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.75.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.75.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.75.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.75.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.76.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.76.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.76.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.76.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.76.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.76.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.77.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.77.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.77.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.77.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.77.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.77.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.78.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.78.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.78.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.78.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.78.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.78.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.79.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.79.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.79.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.79.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.79.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.79.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.8.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.8.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.8.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.8.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.8.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.8.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.80.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.80.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.80.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.80.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.80.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.80.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.81.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.81.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.81.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.81.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.81.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.81.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.82.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.82.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.82.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.82.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.82.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.82.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.83.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.83.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.83.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.83.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.83.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.83.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.84.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.84.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.84.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.84.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.84.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.84.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.85.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.85.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.85.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.85.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.85.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.85.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.86.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.86.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.86.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.86.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.86.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.86.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.87.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.87.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.87.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.87.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.87.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.87.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.88.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.88.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.88.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.88.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.88.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.88.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.89.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.89.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.89.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.89.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.89.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.89.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.9.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.9.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.9.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.9.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.9.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.9.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.90.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.90.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.90.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.90.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.90.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.90.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.91.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.91.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.91.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.91.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.91.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.91.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.92.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.92.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.92.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.92.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.92.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.92.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.93.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.93.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.93.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.93.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.93.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.93.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.94.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.94.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.94.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.94.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.94.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.94.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.95.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.95.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.95.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.95.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.95.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.95.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.96.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.96.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.96.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.96.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.96.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.96.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.97.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.97.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.97.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.97.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.97.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.97.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.98.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.98.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.98.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.98.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.98.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.98.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.99.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.99.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.99.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.99.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.99.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.experts.99.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.gate.e_score_correction_bias": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.gate.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.shared_experts.down_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.shared_experts.down_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.shared_experts.gate_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.shared_experts.gate_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.shared_experts.up_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.mlp.shared_experts.up_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.post_attention_layernorm.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.self_attn.k_norm.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.self_attn.k_proj.bias": "model-00089-of-00092.safetensors",
+ "model.layers.88.self_attn.k_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.self_attn.k_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.self_attn.o_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.self_attn.o_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.self_attn.q_norm.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.self_attn.q_proj.bias": "model-00089-of-00092.safetensors",
+ "model.layers.88.self_attn.q_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.self_attn.q_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.88.self_attn.v_proj.bias": "model-00089-of-00092.safetensors",
+ "model.layers.88.self_attn.v_proj.weight": "model-00089-of-00092.safetensors",
+ "model.layers.88.self_attn.v_proj.weight_scale": "model-00089-of-00092.safetensors",
+ "model.layers.89.input_layernorm.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.0.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.0.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.0.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.0.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.0.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.0.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.1.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.1.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.1.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.1.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.1.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.1.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.10.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.10.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.10.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.10.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.10.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.10.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.100.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.100.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.100.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.100.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.100.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.100.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.101.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.101.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.101.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.101.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.101.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.101.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.102.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.102.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.102.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.102.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.102.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.102.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.103.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.103.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.103.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.103.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.103.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.103.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.104.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.104.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.104.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.104.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.104.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.104.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.105.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.105.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.105.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.105.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.105.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.105.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.106.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.106.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.106.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.106.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.106.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.106.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.107.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.107.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.107.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.107.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.107.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.107.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.108.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.108.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.108.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.108.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.108.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.108.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.109.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.109.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.109.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.109.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.109.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.109.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.11.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.11.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.11.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.11.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.11.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.11.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.110.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.110.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.110.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.110.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.110.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.110.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.111.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.111.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.111.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.111.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.111.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.111.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.112.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.112.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.112.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.112.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.112.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.112.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.113.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.113.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.113.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.113.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.113.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.113.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.114.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.114.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.114.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.114.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.114.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.114.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.115.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.115.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.115.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.115.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.115.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.115.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.116.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.116.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.116.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.116.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.116.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.116.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.117.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.117.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.117.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.117.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.117.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.117.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.118.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.118.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.118.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.118.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.118.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.118.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.119.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.119.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.119.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.119.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.119.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.119.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.12.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.12.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.12.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.12.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.12.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.12.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.120.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.120.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.120.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.120.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.120.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.120.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.121.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.121.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.121.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.121.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.121.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.121.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.122.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.122.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.122.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.122.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.122.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.122.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.123.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.123.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.123.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.123.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.123.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.123.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.124.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.124.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.124.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.124.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.124.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.124.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.125.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.125.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.125.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.125.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.125.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.125.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.126.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.126.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.126.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.126.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.126.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.126.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.127.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.127.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.127.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.127.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.127.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.127.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.128.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.128.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.128.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.128.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.128.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.128.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.129.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.129.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.129.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.129.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.129.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.129.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.13.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.13.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.13.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.13.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.13.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.13.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.130.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.130.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.130.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.130.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.130.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.130.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.131.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.131.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.131.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.131.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.131.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.131.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.132.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.132.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.132.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.132.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.132.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.132.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.133.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.133.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.133.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.133.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.133.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.133.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.134.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.134.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.134.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.134.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.134.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.134.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.135.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.135.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.135.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.135.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.135.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.135.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.136.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.136.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.136.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.136.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.136.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.136.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.137.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.137.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.137.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.137.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.137.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.137.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.138.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.138.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.138.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.138.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.138.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.138.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.139.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.139.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.139.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.139.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.139.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.139.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.14.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.14.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.14.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.14.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.14.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.14.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.140.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.140.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.140.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.140.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.140.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.140.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.141.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.141.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.141.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.141.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.141.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.141.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.142.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.142.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.142.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.142.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.142.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.142.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.143.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.143.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.143.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.143.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.143.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.143.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.144.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.144.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.144.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.144.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.144.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.144.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.145.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.145.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.145.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.145.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.145.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.145.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.146.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.146.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.146.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.146.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.146.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.146.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.147.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.147.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.147.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.147.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.147.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.147.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.148.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.148.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.148.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.148.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.148.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.148.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.149.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.149.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.149.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.149.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.149.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.149.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.15.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.15.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.15.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.15.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.15.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.15.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.150.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.150.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.150.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.150.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.150.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.150.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.151.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.151.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.151.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.151.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.151.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.151.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.152.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.152.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.152.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.152.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.152.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.152.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.153.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.153.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.153.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.153.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.153.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.153.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.154.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.154.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.154.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.154.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.154.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.154.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.155.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.155.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.155.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.155.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.155.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.155.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.156.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.156.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.156.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.156.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.156.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.156.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.157.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.157.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.157.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.157.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.157.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.157.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.158.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.158.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.158.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.158.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.158.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.158.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.159.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.159.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.159.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.159.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.159.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.159.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.16.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.16.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.16.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.16.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.16.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.16.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.17.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.17.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.17.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.17.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.17.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.17.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.18.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.18.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.18.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.18.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.18.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.18.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.19.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.19.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.19.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.19.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.19.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.19.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.2.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.2.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.2.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.2.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.2.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.2.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.20.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.20.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.20.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.20.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.20.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.20.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.21.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.21.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.21.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.21.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.21.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.21.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.22.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.22.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.22.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.22.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.22.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.22.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.23.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.23.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.23.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.23.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.23.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.23.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.24.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.24.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.24.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.24.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.24.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.24.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.25.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.25.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.25.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.25.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.25.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.25.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.26.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.26.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.26.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.26.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.26.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.26.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.27.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.27.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.27.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.27.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.27.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.27.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.28.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.28.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.28.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.28.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.28.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.28.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.29.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.29.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.29.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.29.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.29.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.29.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.3.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.3.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.3.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.3.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.3.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.3.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.30.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.30.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.30.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.30.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.30.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.30.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.31.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.31.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.31.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.31.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.31.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.31.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.32.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.32.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.32.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.32.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.32.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.32.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.33.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.33.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.33.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.33.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.33.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.33.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.34.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.34.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.34.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.34.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.34.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.34.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.35.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.35.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.35.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.35.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.35.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.35.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.36.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.36.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.36.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.36.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.36.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.36.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.37.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.37.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.37.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.37.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.37.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.37.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.38.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.38.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.38.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.38.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.38.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.38.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.39.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.39.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.39.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.39.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.39.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.39.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.4.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.4.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.4.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.4.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.4.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.4.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.40.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.40.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.40.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.40.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.40.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.40.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.41.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.41.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.41.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.41.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.41.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.41.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.42.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.42.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.42.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.42.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.42.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.42.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.43.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.43.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.43.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.43.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.43.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.43.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.44.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.44.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.44.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.44.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.44.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.44.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.45.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.45.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.45.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.45.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.45.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.45.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.46.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.46.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.46.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.46.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.46.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.46.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.47.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.47.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.47.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.47.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.47.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.47.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.48.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.48.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.48.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.48.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.48.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.48.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.49.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.49.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.49.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.49.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.49.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.49.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.5.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.5.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.5.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.5.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.5.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.5.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.50.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.50.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.50.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.50.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.50.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.50.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.51.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.51.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.51.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.51.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.51.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.51.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.52.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.52.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.52.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.52.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.52.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.52.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.53.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.53.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.53.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.53.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.53.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.53.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.54.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.54.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.54.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.54.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.54.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.54.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.55.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.55.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.55.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.55.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.55.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.55.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.56.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.56.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.56.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.56.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.56.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.56.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.57.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.57.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.57.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.57.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.57.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.57.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.58.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.58.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.58.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.58.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.58.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.58.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.59.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.59.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.59.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.59.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.59.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.59.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.6.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.6.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.6.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.6.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.6.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.6.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.60.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.60.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.60.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.60.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.60.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.60.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.61.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.61.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.61.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.61.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.61.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.61.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.62.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.62.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.62.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.62.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.62.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.62.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.63.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.63.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.63.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.63.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.63.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.63.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.64.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.64.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.64.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.64.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.64.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.64.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.65.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.65.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.65.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.65.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.65.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.65.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.66.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.66.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.66.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.66.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.66.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.66.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.67.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.67.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.67.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.67.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.67.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.67.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.68.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.68.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.68.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.68.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.68.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.68.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.69.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.69.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.69.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.69.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.69.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.69.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.7.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.7.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.7.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.7.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.7.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.7.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.70.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.70.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.70.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.70.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.70.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.70.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.71.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.71.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.71.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.71.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.71.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.71.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.72.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.72.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.72.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.72.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.72.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.72.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.73.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.73.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.73.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.73.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.73.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.73.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.74.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.74.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.74.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.74.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.74.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.74.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.75.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.75.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.75.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.75.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.75.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.75.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.76.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.76.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.76.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.76.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.76.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.76.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.77.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.77.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.77.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.77.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.77.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.77.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.78.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.78.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.78.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.78.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.78.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.78.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.79.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.79.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.79.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.79.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.79.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.79.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.8.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.8.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.8.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.8.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.8.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.8.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.80.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.80.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.80.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.80.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.80.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.80.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.81.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.81.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.81.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.81.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.81.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.81.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.82.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.82.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.82.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.82.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.82.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.82.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.83.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.83.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.83.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.83.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.83.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.83.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.84.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.84.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.84.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.84.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.84.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.84.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.85.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.85.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.85.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.85.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.85.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.85.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.86.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.86.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.86.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.86.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.86.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.86.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.87.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.87.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.87.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.87.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.87.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.87.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.88.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.88.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.88.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.88.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.88.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.88.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.89.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.89.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.89.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.89.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.89.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.89.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.9.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.9.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.9.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.9.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.9.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.9.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.90.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.90.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.90.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.90.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.90.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.90.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.91.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.91.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.91.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.91.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.91.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.91.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.92.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.92.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.92.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.92.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.92.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.92.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.93.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.93.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.93.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.93.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.93.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.93.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.94.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.94.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.94.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.94.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.94.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.94.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.95.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.95.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.95.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.95.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.95.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.95.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.96.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.96.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.96.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.96.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.96.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.96.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.97.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.97.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.97.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.97.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.97.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.97.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.98.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.98.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.98.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.98.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.98.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.98.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.99.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.99.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.99.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.99.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.99.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.experts.99.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.gate.e_score_correction_bias": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.gate.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.shared_experts.down_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.shared_experts.down_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.shared_experts.gate_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.shared_experts.gate_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.shared_experts.up_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.mlp.shared_experts.up_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.post_attention_layernorm.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.self_attn.k_norm.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.self_attn.k_proj.bias": "model-00090-of-00092.safetensors",
+ "model.layers.89.self_attn.k_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.self_attn.k_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.self_attn.o_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.self_attn.o_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.self_attn.q_norm.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.self_attn.q_proj.bias": "model-00090-of-00092.safetensors",
+ "model.layers.89.self_attn.q_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.self_attn.q_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.89.self_attn.v_proj.bias": "model-00090-of-00092.safetensors",
+ "model.layers.89.self_attn.v_proj.weight": "model-00090-of-00092.safetensors",
+ "model.layers.89.self_attn.v_proj.weight_scale": "model-00090-of-00092.safetensors",
+ "model.layers.9.input_layernorm.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.0.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.0.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.0.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.0.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.0.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.0.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.1.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.1.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.1.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.1.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.1.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.1.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.10.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.10.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.10.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.10.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.10.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.10.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.100.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.100.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.100.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.100.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.100.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.100.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.101.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.101.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.101.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.101.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.101.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.101.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.102.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.102.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.102.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.102.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.102.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.102.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.103.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.103.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.103.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.103.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.103.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.103.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.104.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.104.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.104.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.104.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.104.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.104.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.105.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.105.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.105.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.105.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.105.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.105.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.106.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.106.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.106.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.106.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.106.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.106.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.107.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.107.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.107.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.107.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.107.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.107.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.108.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.108.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.108.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.108.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.108.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.108.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.109.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.109.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.109.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.109.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.109.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.109.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.11.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.11.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.11.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.11.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.11.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.11.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.110.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.110.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.110.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.110.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.110.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.110.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.111.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.111.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.111.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.111.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.111.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.111.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.112.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.112.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.112.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.112.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.112.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.112.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.113.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.113.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.113.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.113.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.113.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.113.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.114.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.114.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.114.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.114.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.114.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.114.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.115.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.115.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.115.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.115.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.115.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.115.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.116.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.116.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.116.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.116.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.116.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.116.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.117.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.117.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.117.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.117.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.117.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.117.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.118.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.118.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.118.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.118.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.118.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.118.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.119.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.119.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.119.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.119.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.119.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.119.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.12.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.12.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.12.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.12.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.12.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.12.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.120.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.120.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.120.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.120.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.120.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.120.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.121.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.121.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.121.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.121.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.121.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.121.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.122.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.122.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.122.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.122.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.122.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.122.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.123.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.123.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.123.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.123.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.123.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.123.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.124.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.124.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.124.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.124.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.124.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.124.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.125.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.125.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.125.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.125.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.125.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.125.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.126.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.126.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.126.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.126.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.126.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.126.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.127.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.127.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.127.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.127.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.127.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.127.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.128.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.128.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.128.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.128.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.128.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.128.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.129.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.129.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.129.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.129.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.129.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.129.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.13.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.13.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.13.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.13.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.13.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.13.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.130.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.130.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.130.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.130.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.130.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.130.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.131.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.131.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.131.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.131.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.131.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.131.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.132.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.132.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.132.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.132.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.132.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.132.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.133.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.133.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.133.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.133.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.133.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.133.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.134.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.134.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.134.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.134.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.134.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.134.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.135.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.135.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.135.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.135.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.135.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.135.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.136.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.136.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.136.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.136.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.136.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.136.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.137.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.137.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.137.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.137.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.137.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.137.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.138.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.138.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.138.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.138.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.138.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.138.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.139.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.139.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.139.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.139.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.139.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.139.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.14.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.14.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.14.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.14.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.14.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.14.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.140.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.140.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.140.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.140.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.140.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.140.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.141.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.141.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.141.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.141.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.141.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.141.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.142.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.142.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.142.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.142.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.142.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.142.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.143.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.143.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.143.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.143.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.143.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.143.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.144.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.144.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.144.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.144.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.144.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.144.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.145.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.145.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.145.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.145.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.145.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.145.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.146.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.146.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.146.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.146.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.146.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.146.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.147.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.147.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.147.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.147.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.147.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.147.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.148.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.148.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.148.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.148.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.148.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.148.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.149.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.149.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.149.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.149.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.149.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.149.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.15.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.15.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.15.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.15.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.15.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.15.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.150.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.150.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.150.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.150.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.150.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.150.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.151.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.151.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.151.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.151.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.151.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.151.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.152.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.152.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.152.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.152.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.152.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.152.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.153.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.153.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.153.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.153.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.153.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.153.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.154.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.154.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.154.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.154.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.154.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.154.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.155.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.155.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.155.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.155.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.155.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.155.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.156.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.156.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.156.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.156.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.156.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.156.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.157.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.157.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.157.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.157.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.157.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.157.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.158.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.158.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.158.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.158.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.158.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.158.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.159.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.159.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.159.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.159.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.159.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.159.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.16.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.16.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.16.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.16.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.16.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.16.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.17.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.17.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.17.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.17.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.17.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.17.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.18.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.18.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.18.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.18.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.18.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.18.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.19.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.19.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.19.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.19.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.19.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.19.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.2.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.2.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.2.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.2.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.2.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.2.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.20.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.20.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.20.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.20.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.20.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.20.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.21.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.21.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.21.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.21.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.21.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.21.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.22.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.22.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.22.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.22.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.22.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.22.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.23.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.23.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.23.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.23.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.23.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.23.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.24.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.24.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.24.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.24.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.24.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.24.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.25.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.25.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.25.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.25.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.25.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.25.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.26.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.26.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.26.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.26.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.26.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.26.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.27.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.27.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.27.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.27.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.27.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.27.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.28.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.28.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.28.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.28.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.28.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.28.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.29.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.29.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.29.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.29.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.29.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.29.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.3.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.3.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.3.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.3.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.3.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.3.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.30.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.30.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.30.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.30.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.30.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.30.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.31.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.31.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.31.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.31.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.31.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.31.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.32.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.32.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.32.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.32.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.32.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.32.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.33.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.33.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.33.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.33.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.33.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.33.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.34.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.34.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.34.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.34.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.34.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.34.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.35.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.35.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.35.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.35.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.35.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.35.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.36.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.36.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.36.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.36.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.36.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.36.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.37.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.37.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.37.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.37.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.37.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.37.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.38.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.38.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.38.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.38.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.38.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.38.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.39.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.39.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.39.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.39.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.39.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.39.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.4.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.4.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.4.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.4.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.4.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.4.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.40.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.40.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.40.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.40.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.40.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.40.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.41.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.41.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.41.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.41.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.41.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.41.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.42.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.42.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.42.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.42.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.42.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.42.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.43.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.43.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.43.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.43.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.43.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.43.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.44.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.44.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.44.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.44.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.44.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.44.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.45.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.45.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.45.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.45.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.45.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.45.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.46.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.46.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.46.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.46.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.46.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.46.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.47.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.47.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.47.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.47.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.47.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.47.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.48.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.48.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.48.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.48.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.48.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.48.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.49.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.49.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.49.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.49.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.49.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.49.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.5.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.5.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.5.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.5.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.5.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.5.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.50.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.50.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.50.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.50.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.50.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.50.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.51.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.51.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.51.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.51.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.51.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.51.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.52.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.52.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.52.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.52.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.52.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.52.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.53.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.53.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.53.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.53.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.53.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.53.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.54.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.54.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.54.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.54.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.54.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.54.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.55.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.55.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.55.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.55.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.55.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.55.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.56.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.56.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.56.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.56.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.56.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.56.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.57.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.57.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.57.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.57.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.57.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.57.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.58.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.58.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.58.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.58.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.58.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.58.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.59.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.59.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.59.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.59.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.59.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.59.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.6.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.6.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.6.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.6.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.6.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.6.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.60.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.60.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.60.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.60.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.60.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.60.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.61.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.61.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.61.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.61.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.61.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.61.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.62.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.62.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.62.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.62.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.62.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.62.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.63.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.63.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.63.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.63.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.63.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.63.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.64.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.64.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.64.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.64.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.64.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.64.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.65.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.65.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.65.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.65.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.65.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.65.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.66.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.66.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.66.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.66.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.66.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.66.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.67.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.67.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.67.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.67.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.67.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.67.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.68.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.68.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.68.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.68.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.68.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.68.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.69.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.69.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.69.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.69.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.69.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.69.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.7.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.7.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.7.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.7.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.7.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.7.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.70.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.70.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.70.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.70.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.70.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.70.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.71.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.71.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.71.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.71.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.71.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.71.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.72.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.72.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.72.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.72.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.72.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.72.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.73.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.73.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.73.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.73.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.73.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.73.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.74.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.74.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.74.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.74.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.74.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.74.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.75.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.75.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.75.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.75.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.75.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.75.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.76.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.76.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.76.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.76.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.76.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.76.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.77.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.77.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.77.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.77.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.77.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.77.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.78.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.78.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.78.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.78.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.78.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.78.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.79.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.79.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.79.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.79.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.79.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.79.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.8.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.8.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.8.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.8.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.8.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.8.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.80.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.80.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.80.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.80.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.80.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.80.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.81.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.81.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.81.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.81.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.81.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.81.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.82.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.82.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.82.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.82.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.82.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.82.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.83.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.83.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.83.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.83.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.83.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.83.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.84.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.84.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.84.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.84.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.84.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.84.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.85.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.85.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.85.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.85.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.85.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.85.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.86.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.86.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.86.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.86.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.86.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.86.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.87.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.87.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.87.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.87.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.87.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.87.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.88.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.88.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.88.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.88.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.88.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.88.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.89.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.89.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.89.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.89.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.89.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.89.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.9.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.9.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.9.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.9.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.9.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.9.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.90.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.90.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.90.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.90.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.90.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.90.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.91.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.91.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.91.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.91.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.91.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.91.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.92.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.92.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.92.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.92.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.92.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.92.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.93.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.93.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.93.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.93.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.93.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.93.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.94.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.94.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.94.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.94.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.94.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.94.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.95.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.95.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.95.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.95.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.95.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.95.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.96.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.96.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.96.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.96.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.96.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.96.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.97.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.97.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.97.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.97.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.97.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.97.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.98.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.98.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.98.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.98.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.98.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.98.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.99.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.99.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.99.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.99.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.99.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.experts.99.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.gate.e_score_correction_bias": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.gate.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.shared_experts.down_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.shared_experts.down_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.shared_experts.gate_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.shared_experts.gate_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.shared_experts.up_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.mlp.shared_experts.up_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.post_attention_layernorm.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.self_attn.k_norm.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.self_attn.k_proj.bias": "model-00010-of-00092.safetensors",
+ "model.layers.9.self_attn.k_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.self_attn.k_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.self_attn.o_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.self_attn.o_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.self_attn.q_norm.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.self_attn.q_proj.bias": "model-00010-of-00092.safetensors",
+ "model.layers.9.self_attn.q_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.self_attn.q_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.9.self_attn.v_proj.bias": "model-00010-of-00092.safetensors",
+ "model.layers.9.self_attn.v_proj.weight": "model-00010-of-00092.safetensors",
+ "model.layers.9.self_attn.v_proj.weight_scale": "model-00010-of-00092.safetensors",
+ "model.layers.90.input_layernorm.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.0.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.0.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.0.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.0.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.0.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.0.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.1.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.1.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.1.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.1.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.1.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.1.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.10.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.10.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.10.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.10.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.10.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.10.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.100.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.100.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.100.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.100.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.100.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.100.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.101.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.101.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.101.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.101.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.101.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.101.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.102.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.102.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.102.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.102.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.102.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.102.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.103.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.103.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.103.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.103.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.103.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.103.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.104.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.104.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.104.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.104.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.104.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.104.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.105.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.105.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.105.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.105.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.105.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.105.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.106.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.106.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.106.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.106.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.106.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.106.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.107.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.107.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.107.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.107.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.107.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.107.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.108.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.108.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.108.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.108.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.108.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.108.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.109.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.109.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.109.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.109.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.109.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.109.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.11.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.11.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.11.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.11.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.11.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.11.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.110.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.110.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.110.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.110.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.110.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.110.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.111.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.111.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.111.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.111.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.111.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.111.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.112.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.112.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.112.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.112.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.112.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.112.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.113.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.113.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.113.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.113.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.113.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.113.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.114.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.114.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.114.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.114.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.114.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.114.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.115.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.115.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.115.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.115.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.115.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.115.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.116.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.116.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.116.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.116.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.116.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.116.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.117.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.117.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.117.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.117.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.117.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.117.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.118.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.118.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.118.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.118.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.118.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.118.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.119.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.119.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.119.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.119.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.119.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.119.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.12.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.12.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.12.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.12.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.12.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.12.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.120.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.120.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.120.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.120.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.120.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.120.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.121.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.121.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.121.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.121.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.121.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.121.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.122.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.122.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.122.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.122.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.122.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.122.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.123.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.123.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.123.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.123.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.123.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.123.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.124.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.124.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.124.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.124.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.124.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.124.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.125.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.125.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.125.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.125.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.125.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.125.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.126.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.126.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.126.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.126.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.126.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.126.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.127.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.127.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.127.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.127.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.127.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.127.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.128.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.128.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.128.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.128.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.128.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.128.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.129.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.129.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.129.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.129.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.129.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.129.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.13.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.13.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.13.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.13.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.13.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.13.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.130.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.130.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.130.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.130.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.130.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.130.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.131.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.131.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.131.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.131.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.131.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.131.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.132.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.132.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.132.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.132.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.132.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.132.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.133.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.133.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.133.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.133.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.133.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.133.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.134.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.134.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.134.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.134.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.134.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.134.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.135.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.135.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.135.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.135.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.135.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.135.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.136.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.136.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.136.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.136.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.136.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.136.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.137.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.137.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.137.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.137.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.137.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.137.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.138.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.138.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.138.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.138.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.138.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.138.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.139.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.139.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.139.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.139.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.139.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.139.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.14.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.14.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.14.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.14.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.14.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.14.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.140.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.140.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.140.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.140.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.140.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.140.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.141.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.141.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.141.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.141.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.141.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.141.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.142.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.142.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.142.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.142.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.142.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.142.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.143.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.143.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.143.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.143.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.143.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.143.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.144.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.144.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.144.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.144.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.144.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.144.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.145.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.145.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.145.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.145.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.145.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.145.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.146.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.146.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.146.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.146.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.146.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.146.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.147.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.147.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.147.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.147.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.147.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.147.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.148.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.148.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.148.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.148.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.148.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.148.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.149.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.149.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.149.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.149.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.149.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.149.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.15.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.15.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.15.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.15.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.15.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.15.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.150.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.150.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.150.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.150.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.150.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.150.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.151.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.151.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.151.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.151.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.151.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.151.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.152.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.152.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.152.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.152.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.152.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.152.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.153.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.153.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.153.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.153.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.153.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.153.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.154.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.154.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.154.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.154.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.154.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.154.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.155.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.155.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.155.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.155.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.155.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.155.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.156.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.156.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.156.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.156.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.156.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.156.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.157.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.157.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.157.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.157.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.157.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.157.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.158.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.158.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.158.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.158.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.158.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.158.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.159.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.159.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.159.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.159.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.159.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.159.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.16.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.16.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.16.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.16.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.16.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.16.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.17.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.17.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.17.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.17.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.17.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.17.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.18.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.18.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.18.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.18.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.18.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.18.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.19.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.19.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.19.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.19.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.19.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.19.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.2.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.2.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.2.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.2.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.2.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.2.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.20.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.20.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.20.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.20.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.20.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.20.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.21.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.21.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.21.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.21.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.21.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.21.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.22.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.22.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.22.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.22.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.22.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.22.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.23.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.23.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.23.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.23.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.23.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.23.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.24.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.24.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.24.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.24.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.24.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.24.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.25.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.25.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.25.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.25.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.25.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.25.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.26.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.26.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.26.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.26.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.26.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.26.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.27.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.27.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.27.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.27.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.27.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.27.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.28.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.28.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.28.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.28.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.28.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.28.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.29.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.29.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.29.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.29.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.29.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.29.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.3.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.3.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.3.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.3.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.3.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.3.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.30.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.30.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.30.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.30.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.30.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.30.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.31.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.31.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.31.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.31.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.31.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.31.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.32.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.32.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.32.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.32.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.32.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.32.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.33.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.33.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.33.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.33.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.33.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.33.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.34.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.34.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.34.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.34.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.34.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.34.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.35.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.35.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.35.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.35.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.35.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.35.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.36.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.36.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.36.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.36.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.36.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.36.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.37.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.37.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.37.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.37.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.37.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.37.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.38.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.38.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.38.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.38.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.38.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.38.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.39.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.39.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.39.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.39.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.39.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.39.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.4.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.4.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.4.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.4.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.4.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.4.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.40.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.40.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.40.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.40.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.40.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.40.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.41.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.41.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.41.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.41.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.41.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.41.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.42.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.42.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.42.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.42.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.42.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.42.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.43.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.43.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.43.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.43.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.43.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.43.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.44.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.44.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.44.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.44.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.44.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.44.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.45.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.45.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.45.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.45.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.45.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.45.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.46.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.46.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.46.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.46.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.46.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.46.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.47.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.47.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.47.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.47.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.47.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.47.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.48.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.48.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.48.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.48.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.48.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.48.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.49.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.49.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.49.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.49.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.49.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.49.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.5.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.5.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.5.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.5.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.5.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.5.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.50.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.50.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.50.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.50.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.50.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.50.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.51.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.51.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.51.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.51.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.51.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.51.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.52.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.52.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.52.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.52.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.52.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.52.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.53.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.53.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.53.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.53.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.53.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.53.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.54.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.54.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.54.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.54.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.54.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.54.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.55.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.55.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.55.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.55.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.55.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.55.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.56.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.56.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.56.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.56.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.56.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.56.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.57.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.57.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.57.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.57.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.57.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.57.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.58.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.58.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.58.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.58.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.58.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.58.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.59.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.59.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.59.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.59.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.59.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.59.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.6.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.6.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.6.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.6.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.6.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.6.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.60.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.60.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.60.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.60.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.60.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.60.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.61.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.61.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.61.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.61.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.61.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.61.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.62.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.62.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.62.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.62.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.62.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.62.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.63.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.63.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.63.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.63.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.63.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.63.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.64.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.64.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.64.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.64.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.64.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.64.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.65.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.65.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.65.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.65.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.65.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.65.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.66.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.66.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.66.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.66.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.66.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.66.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.67.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.67.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.67.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.67.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.67.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.67.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.68.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.68.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.68.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.68.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.68.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.68.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.69.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.69.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.69.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.69.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.69.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.69.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.7.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.7.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.7.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.7.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.7.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.7.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.70.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.70.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.70.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.70.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.70.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.70.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.71.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.71.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.71.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.71.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.71.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.71.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.72.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.72.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.72.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.72.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.72.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.72.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.73.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.73.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.73.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.73.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.73.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.73.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.74.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.74.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.74.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.74.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.74.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.74.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.75.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.75.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.75.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.75.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.75.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.75.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.76.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.76.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.76.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.76.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.76.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.76.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.77.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.77.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.77.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.77.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.77.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.77.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.78.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.78.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.78.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.78.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.78.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.78.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.79.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.79.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.79.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.79.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.79.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.79.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.8.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.8.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.8.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.8.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.8.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.8.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.80.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.80.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.80.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.80.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.80.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.80.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.81.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.81.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.81.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.81.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.81.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.81.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.82.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.82.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.82.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.82.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.82.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.82.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.83.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.83.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.83.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.83.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.83.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.83.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.84.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.84.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.84.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.84.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.84.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.84.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.85.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.85.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.85.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.85.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.85.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.85.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.86.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.86.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.86.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.86.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.86.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.86.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.87.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.87.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.87.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.87.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.87.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.87.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.88.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.88.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.88.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.88.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.88.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.88.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.89.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.89.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.89.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.89.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.89.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.89.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.9.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.9.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.9.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.9.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.9.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.9.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.90.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.90.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.90.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.90.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.90.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.90.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.91.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.91.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.91.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.91.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.91.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.91.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.92.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.92.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.92.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.92.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.92.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.92.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.93.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.93.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.93.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.93.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.93.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.93.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.94.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.94.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.94.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.94.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.94.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.94.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.95.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.95.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.95.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.95.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.95.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.95.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.96.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.96.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.96.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.96.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.96.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.96.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.97.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.97.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.97.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.97.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.97.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.97.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.98.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.98.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.98.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.98.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.98.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.98.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.99.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.99.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.99.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.99.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.99.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.experts.99.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.gate.e_score_correction_bias": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.gate.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.shared_experts.down_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.shared_experts.down_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.shared_experts.gate_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.shared_experts.gate_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.shared_experts.up_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.mlp.shared_experts.up_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.post_attention_layernorm.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.self_attn.k_norm.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.self_attn.k_proj.bias": "model-00091-of-00092.safetensors",
+ "model.layers.90.self_attn.k_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.self_attn.k_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.self_attn.o_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.self_attn.o_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.self_attn.q_norm.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.self_attn.q_proj.bias": "model-00091-of-00092.safetensors",
+ "model.layers.90.self_attn.q_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.self_attn.q_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.90.self_attn.v_proj.bias": "model-00091-of-00092.safetensors",
+ "model.layers.90.self_attn.v_proj.weight": "model-00091-of-00092.safetensors",
+ "model.layers.90.self_attn.v_proj.weight_scale": "model-00091-of-00092.safetensors",
+ "model.layers.91.input_layernorm.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.0.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.0.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.0.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.0.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.0.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.0.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.1.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.1.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.1.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.1.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.1.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.1.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.10.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.10.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.10.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.10.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.10.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.10.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.100.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.100.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.100.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.100.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.100.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.100.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.101.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.101.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.101.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.101.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.101.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.101.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.102.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.102.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.102.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.102.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.102.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.102.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.103.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.103.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.103.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.103.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.103.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.103.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.104.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.104.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.104.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.104.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.104.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.104.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.105.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.105.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.105.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.105.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.105.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.105.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.106.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.106.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.106.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.106.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.106.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.106.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.107.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.107.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.107.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.107.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.107.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.107.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.108.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.108.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.108.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.108.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.108.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.108.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.109.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.109.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.109.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.109.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.109.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.109.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.11.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.11.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.11.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.11.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.11.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.11.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.110.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.110.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.110.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.110.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.110.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.110.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.111.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.111.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.111.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.111.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.111.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.111.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.112.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.112.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.112.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.112.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.112.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.112.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.113.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.113.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.113.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.113.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.113.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.113.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.114.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.114.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.114.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.114.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.114.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.114.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.115.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.115.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.115.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.115.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.115.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.115.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.116.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.116.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.116.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.116.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.116.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.116.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.117.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.117.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.117.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.117.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.117.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.117.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.118.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.118.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.118.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.118.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.118.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.118.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.119.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.119.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.119.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.119.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.119.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.119.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.12.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.12.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.12.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.12.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.12.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.12.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.120.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.120.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.120.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.120.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.120.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.120.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.121.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.121.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.121.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.121.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.121.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.121.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.122.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.122.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.122.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.122.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.122.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.122.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.123.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.123.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.123.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.123.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.123.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.123.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.124.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.124.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.124.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.124.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.124.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.124.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.125.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.125.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.125.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.125.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.125.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.125.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.126.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.126.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.126.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.126.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.126.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.126.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.127.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.127.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.127.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.127.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.127.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.127.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.128.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.128.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.128.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.128.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.128.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.128.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.129.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.129.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.129.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.129.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.129.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.129.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.13.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.13.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.13.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.13.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.13.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.13.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.130.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.130.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.130.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.130.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.130.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.130.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.131.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.131.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.131.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.131.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.131.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.131.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.132.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.132.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.132.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.132.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.132.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.132.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.133.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.133.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.133.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.133.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.133.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.133.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.134.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.134.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.134.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.134.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.134.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.134.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.135.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.135.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.135.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.135.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.135.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.135.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.136.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.136.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.136.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.136.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.136.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.136.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.137.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.137.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.137.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.137.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.137.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.137.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.138.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.138.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.138.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.138.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.138.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.138.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.139.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.139.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.139.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.139.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.139.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.139.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.14.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.14.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.14.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.14.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.14.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.14.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.140.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.140.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.140.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.140.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.140.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.140.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.141.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.141.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.141.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.141.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.141.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.141.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.142.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.142.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.142.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.142.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.142.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.142.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.143.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.143.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.143.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.143.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.143.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.143.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.144.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.144.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.144.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.144.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.144.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.144.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.145.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.145.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.145.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.145.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.145.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.145.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.146.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.146.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.146.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.146.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.146.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.146.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.147.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.147.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.147.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.147.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.147.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.147.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.148.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.148.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.148.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.148.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.148.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.148.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.149.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.149.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.149.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.149.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.149.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.149.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.15.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.15.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.15.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.15.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.15.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.15.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.150.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.150.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.150.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.150.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.150.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.150.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.151.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.151.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.151.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.151.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.151.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.151.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.152.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.152.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.152.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.152.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.152.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.152.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.153.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.153.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.153.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.153.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.153.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.153.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.154.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.154.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.154.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.154.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.154.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.154.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.155.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.155.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.155.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.155.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.155.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.155.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.156.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.156.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.156.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.156.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.156.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.156.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.157.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.157.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.157.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.157.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.157.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.157.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.158.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.158.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.158.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.158.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.158.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.158.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.159.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.159.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.159.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.159.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.159.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.159.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.16.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.16.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.16.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.16.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.16.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.16.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.17.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.17.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.17.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.17.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.17.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.17.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.18.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.18.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.18.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.18.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.18.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.18.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.19.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.19.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.19.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.19.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.19.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.19.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.2.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.2.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.2.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.2.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.2.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.2.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.20.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.20.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.20.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.20.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.20.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.20.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.21.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.21.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.21.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.21.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.21.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.21.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.22.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.22.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.22.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.22.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.22.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.22.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.23.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.23.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.23.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.23.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.23.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.23.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.24.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.24.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.24.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.24.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.24.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.24.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.25.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.25.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.25.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.25.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.25.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.25.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.26.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.26.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.26.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.26.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.26.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.26.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.27.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.27.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.27.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.27.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.27.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.27.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.28.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.28.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.28.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.28.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.28.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.28.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.29.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.29.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.29.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.29.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.29.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.29.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.3.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.3.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.3.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.3.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.3.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.3.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.30.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.30.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.30.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.30.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.30.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.30.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.31.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.31.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.31.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.31.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.31.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.31.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.32.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.32.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.32.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.32.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.32.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.32.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.33.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.33.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.33.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.33.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.33.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.33.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.34.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.34.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.34.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.34.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.34.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.34.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.35.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.35.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.35.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.35.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.35.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.35.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.36.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.36.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.36.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.36.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.36.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.36.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.37.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.37.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.37.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.37.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.37.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.37.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.38.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.38.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.38.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.38.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.38.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.38.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.39.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.39.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.39.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.39.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.39.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.39.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.4.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.4.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.4.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.4.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.4.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.4.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.40.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.40.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.40.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.40.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.40.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.40.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.41.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.41.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.41.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.41.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.41.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.41.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.42.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.42.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.42.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.42.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.42.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.42.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.43.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.43.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.43.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.43.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.43.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.43.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.44.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.44.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.44.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.44.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.44.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.44.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.45.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.45.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.45.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.45.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.45.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.45.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.46.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.46.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.46.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.46.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.46.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.46.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.47.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.47.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.47.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.47.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.47.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.47.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.48.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.48.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.48.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.48.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.48.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.48.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.49.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.49.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.49.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.49.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.49.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.49.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.5.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.5.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.5.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.5.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.5.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.5.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.50.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.50.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.50.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.50.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.50.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.50.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.51.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.51.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.51.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.51.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.51.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.51.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.52.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.52.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.52.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.52.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.52.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.52.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.53.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.53.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.53.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.53.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.53.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.53.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.54.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.54.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.54.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.54.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.54.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.54.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.55.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.55.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.55.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.55.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.55.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.55.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.56.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.56.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.56.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.56.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.56.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.56.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.57.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.57.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.57.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.57.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.57.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.57.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.58.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.58.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.58.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.58.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.58.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.58.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.59.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.59.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.59.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.59.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.59.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.59.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.6.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.6.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.6.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.6.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.6.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.6.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.60.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.60.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.60.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.60.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.60.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.60.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.61.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.61.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.61.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.61.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.61.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.61.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.62.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.62.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.62.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.62.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.62.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.62.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.63.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.63.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.63.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.63.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.63.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.63.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.64.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.64.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.64.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.64.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.64.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.64.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.65.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.65.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.65.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.65.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.65.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.65.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.66.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.66.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.66.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.66.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.66.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.66.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.67.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.67.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.67.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.67.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.67.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.67.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.68.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.68.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.68.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.68.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.68.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.68.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.69.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.69.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.69.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.69.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.69.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.69.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.7.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.7.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.7.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.7.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.7.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.7.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.70.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.70.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.70.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.70.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.70.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.70.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.71.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.71.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.71.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.71.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.71.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.71.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.72.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.72.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.72.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.72.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.72.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.72.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.73.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.73.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.73.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.73.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.73.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.73.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.74.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.74.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.74.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.74.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.74.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.74.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.75.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.75.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.75.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.75.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.75.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.75.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.76.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.76.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.76.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.76.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.76.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.76.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.77.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.77.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.77.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.77.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.77.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.77.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.78.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.78.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.78.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.78.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.78.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.78.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.79.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.79.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.79.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.79.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.79.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.79.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.8.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.8.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.8.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.8.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.8.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.8.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.80.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.80.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.80.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.80.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.80.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.80.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.81.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.81.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.81.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.81.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.81.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.81.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.82.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.82.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.82.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.82.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.82.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.82.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.83.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.83.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.83.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.83.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.83.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.83.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.84.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.84.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.84.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.84.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.84.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.84.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.85.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.85.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.85.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.85.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.85.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.85.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.86.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.86.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.86.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.86.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.86.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.86.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.87.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.87.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.87.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.87.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.87.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.87.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.88.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.88.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.88.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.88.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.88.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.88.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.89.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.89.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.89.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.89.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.89.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.89.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.9.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.9.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.9.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.9.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.9.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.9.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.90.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.90.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.90.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.90.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.90.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.90.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.91.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.91.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.91.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.91.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.91.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.91.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.92.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.92.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.92.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.92.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.92.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.92.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.93.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.93.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.93.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.93.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.93.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.93.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.94.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.94.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.94.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.94.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.94.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.94.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.95.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.95.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.95.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.95.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.95.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.95.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.96.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.96.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.96.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.96.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.96.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.96.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.97.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.97.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.97.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.97.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.97.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.97.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.98.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.98.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.98.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.98.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.98.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.98.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.99.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.99.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.99.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.99.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.99.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.experts.99.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.gate.e_score_correction_bias": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.gate.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.shared_experts.down_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.shared_experts.down_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.shared_experts.gate_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.shared_experts.gate_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.shared_experts.up_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.mlp.shared_experts.up_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.post_attention_layernorm.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.self_attn.k_norm.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.self_attn.k_proj.bias": "model-00092-of-00092.safetensors",
+ "model.layers.91.self_attn.k_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.self_attn.k_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.self_attn.o_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.self_attn.o_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.self_attn.q_norm.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.self_attn.q_proj.bias": "model-00092-of-00092.safetensors",
+ "model.layers.91.self_attn.q_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.self_attn.q_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.91.self_attn.v_proj.bias": "model-00092-of-00092.safetensors",
+ "model.layers.91.self_attn.v_proj.weight": "model-00092-of-00092.safetensors",
+ "model.layers.91.self_attn.v_proj.weight_scale": "model-00092-of-00092.safetensors",
+ "model.layers.92.eh_proj.weight": "mtp.safetensors",
+ "model.layers.92.enorm.weight": "mtp.safetensors",
+ "model.layers.92.hnorm.weight": "mtp.safetensors",
+ "model.layers.92.input_layernorm.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.0.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.0.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.0.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.1.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.1.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.1.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.10.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.10.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.10.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.100.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.100.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.100.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.101.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.101.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.101.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.102.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.102.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.102.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.103.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.103.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.103.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.104.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.104.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.104.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.105.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.105.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.105.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.106.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.106.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.106.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.107.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.107.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.107.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.108.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.108.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.108.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.109.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.109.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.109.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.11.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.11.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.11.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.110.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.110.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.110.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.111.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.111.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.111.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.112.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.112.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.112.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.113.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.113.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.113.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.114.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.114.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.114.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.115.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.115.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.115.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.116.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.116.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.116.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.117.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.117.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.117.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.118.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.118.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.118.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.119.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.119.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.119.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.12.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.12.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.12.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.120.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.120.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.120.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.121.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.121.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.121.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.122.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.122.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.122.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.123.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.123.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.123.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.124.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.124.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.124.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.125.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.125.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.125.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.126.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.126.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.126.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.127.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.127.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.127.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.128.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.128.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.128.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.129.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.129.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.129.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.13.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.13.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.13.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.130.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.130.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.130.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.131.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.131.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.131.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.132.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.132.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.132.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.133.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.133.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.133.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.134.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.134.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.134.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.135.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.135.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.135.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.136.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.136.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.136.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.137.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.137.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.137.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.138.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.138.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.138.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.139.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.139.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.139.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.14.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.14.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.14.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.140.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.140.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.140.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.141.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.141.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.141.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.142.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.142.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.142.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.143.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.143.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.143.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.144.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.144.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.144.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.145.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.145.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.145.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.146.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.146.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.146.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.147.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.147.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.147.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.148.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.148.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.148.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.149.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.149.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.149.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.15.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.15.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.15.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.150.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.150.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.150.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.151.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.151.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.151.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.152.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.152.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.152.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.153.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.153.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.153.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.154.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.154.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.154.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.155.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.155.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.155.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.156.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.156.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.156.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.157.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.157.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.157.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.158.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.158.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.158.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.159.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.159.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.159.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.16.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.16.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.16.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.17.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.17.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.17.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.18.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.18.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.18.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.19.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.19.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.19.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.2.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.2.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.2.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.20.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.20.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.20.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.21.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.21.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.21.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.22.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.22.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.22.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.23.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.23.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.23.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.24.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.24.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.24.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.25.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.25.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.25.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.26.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.26.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.26.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.27.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.27.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.27.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.28.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.28.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.28.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.29.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.29.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.29.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.3.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.3.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.3.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.30.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.30.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.30.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.31.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.31.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.31.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.32.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.32.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.32.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.33.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.33.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.33.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.34.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.34.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.34.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.35.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.35.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.35.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.36.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.36.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.36.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.37.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.37.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.37.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.38.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.38.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.38.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.39.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.39.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.39.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.4.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.4.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.4.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.40.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.40.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.40.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.41.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.41.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.41.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.42.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.42.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.42.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.43.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.43.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.43.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.44.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.44.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.44.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.45.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.45.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.45.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.46.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.46.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.46.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.47.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.47.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.47.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.48.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.48.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.48.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.49.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.49.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.49.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.5.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.5.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.5.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.50.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.50.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.50.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.51.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.51.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.51.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.52.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.52.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.52.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.53.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.53.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.53.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.54.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.54.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.54.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.55.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.55.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.55.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.56.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.56.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.56.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.57.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.57.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.57.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.58.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.58.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.58.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.59.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.59.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.59.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.6.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.6.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.6.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.60.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.60.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.60.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.61.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.61.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.61.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.62.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.62.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.62.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.63.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.63.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.63.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.64.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.64.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.64.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.65.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.65.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.65.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.66.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.66.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.66.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.67.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.67.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.67.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.68.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.68.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.68.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.69.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.69.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.69.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.7.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.7.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.7.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.70.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.70.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.70.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.71.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.71.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.71.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.72.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.72.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.72.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.73.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.73.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.73.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.74.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.74.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.74.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.75.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.75.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.75.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.76.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.76.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.76.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.77.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.77.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.77.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.78.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.78.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.78.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.79.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.79.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.79.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.8.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.8.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.8.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.80.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.80.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.80.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.81.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.81.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.81.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.82.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.82.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.82.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.83.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.83.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.83.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.84.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.84.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.84.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.85.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.85.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.85.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.86.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.86.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.86.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.87.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.87.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.87.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.88.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.88.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.88.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.89.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.89.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.89.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.9.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.9.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.9.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.90.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.90.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.90.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.91.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.91.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.91.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.92.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.92.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.92.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.93.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.93.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.93.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.94.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.94.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.94.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.95.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.95.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.95.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.96.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.96.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.96.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.97.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.97.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.97.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.98.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.98.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.98.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.99.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.99.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.experts.99.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.gate.e_score_correction_bias": "mtp.safetensors",
+ "model.layers.92.mlp.gate.weight": "mtp.safetensors",
+ "model.layers.92.mlp.shared_experts.down_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.shared_experts.gate_proj.weight": "mtp.safetensors",
+ "model.layers.92.mlp.shared_experts.up_proj.weight": "mtp.safetensors",
+ "model.layers.92.post_attention_layernorm.weight": "mtp.safetensors",
+ "model.layers.92.self_attn.k_norm.weight": "mtp.safetensors",
+ "model.layers.92.self_attn.k_proj.bias": "mtp.safetensors",
+ "model.layers.92.self_attn.k_proj.weight": "mtp.safetensors",
+ "model.layers.92.self_attn.o_proj.weight": "mtp.safetensors",
+ "model.layers.92.self_attn.q_norm.weight": "mtp.safetensors",
+ "model.layers.92.self_attn.q_proj.bias": "mtp.safetensors",
+ "model.layers.92.self_attn.q_proj.weight": "mtp.safetensors",
+ "model.layers.92.self_attn.v_proj.bias": "mtp.safetensors",
+ "model.layers.92.self_attn.v_proj.weight": "mtp.safetensors",
+ "model.layers.92.shared_head.norm.weight": "mtp.safetensors",
+ "model.norm.weight": "model-00092-of-00092.safetensors"
+ }
+}
\ No newline at end of file
diff --git a/mtp.safetensors b/mtp.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..f5176f4a41901192f4a04fc830af6a21108903ff
--- /dev/null
+++ b/mtp.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:74a26e5f1245a153f3a9ab94219266aeb632e9dd90ce63fbada1a8c39f47924b
+size 7976202392
diff --git a/tokenizer.json b/tokenizer.json
new file mode 100644
index 0000000000000000000000000000000000000000..43a71efad1ab3f7e4d66d1e48e7cc44f68f21f3a
--- /dev/null
+++ b/tokenizer.json
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9340665016419c825c4bdabbcc9acc43b7ca2c68ce142724afa829abb1be5efd
+size 19970699
diff --git a/tokenizer_config.json b/tokenizer_config.json
new file mode 100644
index 0000000000000000000000000000000000000000..053f12c9b03d5acbcc921042ea0c87a6baa5d3f7
--- /dev/null
+++ b/tokenizer_config.json
@@ -0,0 +1,325 @@
+{
+ "added_tokens_decoder": {
+ "151329": {
+ "content": "<|endoftext|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151330": {
+ "content": "[MASK]",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151331": {
+ "content": "[gMASK]",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151332": {
+ "content": "[sMASK]",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151333": {
+ "content": "",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151334": {
+ "content": "",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151335": {
+ "content": "<|system|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151336": {
+ "content": "<|user|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151337": {
+ "content": "<|assistant|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151338": {
+ "content": "<|observation|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151339": {
+ "content": "<|begin_of_image|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151340": {
+ "content": "<|end_of_image|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151341": {
+ "content": "<|begin_of_video|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151342": {
+ "content": "<|end_of_video|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151343": {
+ "content": "<|begin_of_audio|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151344": {
+ "content": "<|end_of_audio|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151345": {
+ "content": "<|begin_of_transcription|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151346": {
+ "content": "<|end_of_transcription|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151347": {
+ "content": "<|code_prefix|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151348": {
+ "content": "<|code_middle|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151349": {
+ "content": "<|code_suffix|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151350": {
+ "content": "",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "151351": {
+ "content": "",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "151352": {
+ "content": "",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "151353": {
+ "content": "",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "151354": {
+ "content": "",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "151355": {
+ "content": "",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "151356": {
+ "content": "",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "151357": {
+ "content": "",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "151358": {
+ "content": "",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "151359": {
+ "content": "",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "151360": {
+ "content": "/nothink",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151361": {
+ "content": "<|begin_of_box|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "151362": {
+ "content": "<|end_of_box|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "151363": {
+ "content": "<|image|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "151364": {
+ "content": "<|video|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ }
+ },
+ "additional_special_tokens": [
+ "<|endoftext|>",
+ "[MASK]",
+ "[gMASK]",
+ "[sMASK]",
+ "",
+ "",
+ "<|system|>",
+ "<|user|>",
+ "<|assistant|>",
+ "<|observation|>",
+ "<|begin_of_image|>",
+ "<|end_of_image|>",
+ "<|begin_of_video|>",
+ "<|end_of_video|>",
+ "<|begin_of_audio|>",
+ "<|end_of_audio|>",
+ "<|begin_of_transcription|>",
+ "<|end_of_transcription|>",
+ "<|code_prefix|>",
+ "<|code_middle|>",
+ "<|code_suffix|>",
+ "/nothink"
+ ],
+ "clean_up_tokenization_spaces": false,
+ "do_lower_case": false,
+ "eos_token": "<|endoftext|>",
+ "extra_special_tokens": {},
+ "model_max_length": 128000,
+ "pad_token": "<|endoftext|>",
+ "padding_side": "left",
+ "remove_space": false,
+ "tokenizer_class": "PreTrainedTokenizer"
+}